diff --git a/model-00001-of-000163.safetensors b/model-00001-of-000163.safetensors index a50ecf7fa9f533ea250e63103ef7436dc733c6f8..4efcd05d7b258feb8585e2662bffffe3394a154d 100644 --- a/model-00001-of-000163.safetensors +++ b/model-00001-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0a53dcdd0939fc01ddbb6927ba46c09497f81efd42e9c3e62245776e66731890 -size 5234138288 +oid sha256:105a51896ad57fa98c800bc7ea7434b1451befe622c9a73c8d47c555baf33b24 +size 8609454256 diff --git a/model-00002-of-000163.safetensors b/model-00002-of-000163.safetensors index b5f30f1492a77f63d60e83c592baf38bf3701853..54b4685e3094b546346ac45a117bbe22b72ce231 100644 --- a/model-00002-of-000163.safetensors +++ b/model-00002-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:de179d950ad25cc4596e26792a1a06a80a46540acef3a9d004cc9940358f3e58 -size 4302381728 +oid sha256:c22106699da0c75391008f48c9cdd1571c47086f95eadcf2f94cfd246cd76c23 +size 8602553952 diff --git a/model-00003-of-000163.safetensors b/model-00003-of-000163.safetensors index e7c7e5625325aa61eb9e7a60232fb95ddb300cde..537b16b8c0e319d892b36b155da5f654ef6908b2 100644 --- a/model-00003-of-000163.safetensors +++ b/model-00003-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ac592467a2391b507296d568a87c6f02d41a1a3473f3bc6705fdafe91a7e84d9 -size 4302382136 +oid sha256:6146853dbbaebe46f7565a10fa49f1a93a305b743190afdc98a52fb65db1170d +size 8602554152 diff --git a/model-00004-of-000163.safetensors b/model-00004-of-000163.safetensors index 5f2dcadc215656ca1642252191e7a3decdee7af9..687645d58e05432ae4b87b7fef0fd8db051b964c 100644 --- a/model-00004-of-000163.safetensors +++ b/model-00004-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6e2c15bd1a0cc9b4da6e5faa5dd82a6e8322fdeef89ea76fa6556e086dac9201 -size 4302347768 +oid sha256:cf09a38a359be1a544393032a939e16c2844a661131839e68e87ebc446d62c5d +size 8598786296 diff --git a/model-00005-of-000163.safetensors b/model-00005-of-000163.safetensors index e7971b62a4bc5788cac37ccbaaeb9b7f89316e32..16d205079059f76a6277e77008234aee4b212bf1 100644 --- a/model-00005-of-000163.safetensors +++ b/model-00005-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d4cd762a7f2575c8a8fb04a68556e2311350567c9cb015fd94af7d37e5ef5c7d -size 4302381912 +oid sha256:aef838f18521784d33422dc974c8df081c216d3d4934f8c93ebc5b27ca4c41b8 +size 8602554048 diff --git a/model-00006-of-000163.safetensors b/model-00006-of-000163.safetensors index a3125b8f54b1c115ea30a1b7ac571a13477e5c9b..6ec351405e94a9c03d2b5f3eda25c0eb61a06408 100644 --- a/model-00006-of-000163.safetensors +++ b/model-00006-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d267c2a6d020ef9e6333f886a52aeba11518fc0e6a2a00261d5ccdff71670fe1 -size 4372071352 +oid sha256:7ed70dbd1eaa25f20d804742ffbff88ec0889641524cadd18fda4e7c9fe825bf +size 8741916520 diff --git a/model-00007-of-000163.safetensors b/model-00007-of-000163.safetensors index b7d038d3c2de443ea5afcef23e26ada1fb292102..3f0aa855606b7450f67189399ccc80fe2b206465 100644 --- a/model-00007-of-000163.safetensors +++ b/model-00007-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6f82b553017ac5b1962ffb68604935780a8699bd929d6a3170134f6dc2736aa0 -size 4306077848 +oid sha256:d0c75355f17df909cbbb3e5bc8ad5390fba9e314da61f8db3b5f46259a1df471 +size 8606225096 diff --git a/model-00008-of-000163.safetensors b/model-00008-of-000163.safetensors index 2ab3cf6864e27f1664600c2910916029d9215e51..57d4db5e19f1f867d16f17106a63f4624cd71d32 100644 --- a/model-00008-of-000163.safetensors +++ b/model-00008-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b8659a4124c5001e4f594fc53586c148c3210c8c080efcd0ebf420df1d18a3d9 -size 4302382112 +oid sha256:4d14209714e82397b08ea4ae44b9e74302462264f93d5dcf458b462920da98bb +size 8602554144 diff --git a/model-00009-of-000163.safetensors b/model-00009-of-000163.safetensors index 6e42b70cc22548d38208b39046e3338392f8ecf8..d2845eff9e96c72332c142693b20c08d84daa762 100644 --- a/model-00009-of-000163.safetensors +++ b/model-00009-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0ff5721c6750889be83e580b0e299ec09519e3fb6adcbd6f3ce490058554f780 -size 4302347960 +oid sha256:a4866ef2c1e62caaab2d3af73b5cdb7943d0222c54d190f792df7c07e920c6f9 +size 8598786392 diff --git a/model-00010-of-000163.safetensors b/model-00010-of-000163.safetensors index 82b0dd8063cf2cdb28607377aab5c09f00ced423..4fc1e3334819544a7f7172e5aa8b1f170f79ae93 100644 --- a/model-00010-of-000163.safetensors +++ b/model-00010-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1533ea7da047d76918ca06e71805c79d5e4ae15b3d46d2df486cbfab1072e8a2 -size 4302381720 +oid sha256:1795439039e9668aab8f071801ca6195b4359caf35fef3d3d49c8730021556ad +size 8602553952 diff --git a/model-00011-of-000163.safetensors b/model-00011-of-000163.safetensors index fe3a40ad513c0a28a108b7e103ef73d615be2f93..d23c3ef99724556277162f8332a276e45f0d68d2 100644 --- a/model-00011-of-000163.safetensors +++ b/model-00011-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0f5477531751d112e6284b08f399f2f848c5fac203eb77f5dbe6825ff99d42d8 -size 4302382136 +oid sha256:cf12bfcbf23a0bf902a8063e05fbf94aff9eeb7500b105efb5a0f96984a85085 +size 8602554152 diff --git a/model-00012-of-000163.safetensors b/model-00012-of-000163.safetensors index 9650e95423ad0646d28125adc1da026dd54b633d..63ec5826b0ff0cd36a3edab11f1469d52d8aba00 100644 --- a/model-00012-of-000163.safetensors +++ b/model-00012-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4f985054e530622211c5606d87ae1b6d28dded975facb701dc0a025d4525bc90 -size 1321583272 +oid sha256:2847fa21aaf22299e57da82dfcfc98b471d03ea1b715f8f08d9263e894ec9840 +size 2642451624 diff --git a/model-00013-of-000163.safetensors b/model-00013-of-000163.safetensors index 6fb68dbed06409a68908cadeb0882c8395a157ec..81d7cfee4c0668ccad92b20129ed145c53787958 100644 --- a/model-00013-of-000163.safetensors +++ b/model-00013-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aeba020edcb35a96ddba8d92ed4b1316f2026dad577668ea6772225f00260fe5 -size 4302314992 +oid sha256:40881a78b1e8c9f1e98f86aa7db77a4f733536e4432445a54771ce8d4cea1c65 +size 8598757320 diff --git a/model-00014-of-000163.safetensors b/model-00014-of-000163.safetensors index ada304f6e7ced7db7b6c02ce4b3fbd2d93543f9f..8816d7d9949ea2011641e8b4bc98b937244df890 100644 --- a/model-00014-of-000163.safetensors +++ b/model-00014-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f4d9f12a0aee0bf6f94e10d18666c6a6ad94b3ee1bf33f37ecb679ed1c031cc -size 4302382088 +oid sha256:630fd2baaa66c181e8aaec475b206345828bace475d1d60eaf9a7a86af42f987 +size 8602554136 diff --git a/model-00015-of-000163.safetensors b/model-00015-of-000163.safetensors index 63ac204f87c249f2abf1eaa8bbbadfcb55544370..fe2330ccb6709ffbf31cbe6ba9a0f693e48dcf04 100644 --- a/model-00015-of-000163.safetensors +++ b/model-00015-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ded3c735c606e9f1bc067f7782b63d701577e59a338b08e3fc49c8fb603be3f8 -size 4302347992 +oid sha256:ef9b5fa3d31f483cb5d65bca6e38281558900b75ac889fb46fa06e441aecf532 +size 8598786408 diff --git a/model-00016-of-000163.safetensors b/model-00016-of-000163.safetensors index c5f03cffef94d7500d0e7882150681fd5a725b33..430cd65dd2cd94eb94744a6ed668b71bc91a55ce 100644 --- a/model-00016-of-000163.safetensors +++ b/model-00016-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:65126dec37ddcaad6a361e7256d7c5d2fb390e11f891f967e32508320f288f40 -size 4302381688 +oid sha256:1a07ff2eea090b50ad6b91fb75a1b7024ea81fdfa86ef7ec42ae2495868baf90 +size 8602553936 diff --git a/model-00017-of-000163.safetensors b/model-00017-of-000163.safetensors index 245e75f7b4b3755ea04c4ee6c84d29040419191e..063f9fc9c32216f7a73cc40be3f2837a14ddf140 100644 --- a/model-00017-of-000163.safetensors +++ b/model-00017-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0919e72baebf3b268e24a76343e7c8c0cc9ce7485e0b10f1ab0cc19877bee049 -size 4302382136 +oid sha256:cd64a3afb2c3b91b67a48ac9e5dc432bebc612072a9866be91c507e671179431 +size 8602554152 diff --git a/model-00018-of-000163.safetensors b/model-00018-of-000163.safetensors index a32be73fa40ee8bf4fc97caa0b7d30420257f931..d61a66b1e6e9f2b799ad5eeb7038fdaec25590a1 100644 --- a/model-00018-of-000163.safetensors +++ b/model-00018-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ab55b759fa61688e5cdbfc0e76426e29eee60cb7dc4098a505268bd8508105c0 -size 4302347800 +oid sha256:d1550c1ea764cdf1856ee6ff282d189b37ddc9680e935875c816eee40e5e869c +size 8598786312 diff --git a/model-00019-of-000163.safetensors b/model-00019-of-000163.safetensors index 1021caf5454200bd34633ec7fc3bb169f40c0006..313d1978455bff177eb7b9465149e3ed13e06ca1 100644 --- a/model-00019-of-000163.safetensors +++ b/model-00019-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ad04d451a23ba6f6f46aaf549ab2c94ae536db3cc451293d2bf86d932d075c42 -size 4302381880 +oid sha256:f6e798b1f96294b4c8fe21bd3441d9876d05a24e17ae646cf924880d8d7e4d69 +size 8602554032 diff --git a/model-00020-of-000163.safetensors b/model-00020-of-000163.safetensors index ef9a4fbdbe318456881bd8cfb0cedc4f96921619..1168d293efbec3bf8428239d4bfb84b23d1a009f 100644 --- a/model-00020-of-000163.safetensors +++ b/model-00020-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:136c023f610ce0f40752907c29137d0ac1c55228cc721e33112d72e1a86b2a64 -size 4302382136 +oid sha256:6c24c9837e75c838ee68bd3db33f6583d012a8b9876149eb52effaffc5863c8b +size 8602554160 diff --git a/model-00021-of-000163.safetensors b/model-00021-of-000163.safetensors index 45f8bec643bfb17f79279cc41753c0e8d6a30133..076eadb483b38b7d43ea046990b246ffb4c69891 100644 --- a/model-00021-of-000163.safetensors +++ b/model-00021-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bdadc13724af4b6fdce0d887a5dabaa9ac2e35f4716a95124f4c9b0161557517 -size 4302348176 +oid sha256:665e6e1a8eeaecf90ef5cca246830ea5b63be16281582aca9a04f3ec53d9b078 +size 8598786512 diff --git a/model-00022-of-000163.safetensors b/model-00022-of-000163.safetensors index 36ea70eee8f91a02a0ad8ef954d8c5c662448838..4c378f9aaf19f40277243239d9bc88e4f1d37cc5 100644 --- a/model-00022-of-000163.safetensors +++ b/model-00022-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e013066a698d160a033b085d2ab350cc487c9526568c23513af655debe2f353f -size 4302382656 +oid sha256:6be1034d71f6a19a35a25f998ace7d4e3d648b58431bc6849fb10ecef0b84fe7 +size 8602554416 diff --git a/model-00023-of-000163.safetensors b/model-00023-of-000163.safetensors index b1712b462fb8bd394e1d58a7ae4fba2547b40a89..7f6a7cfeea00c6ec1031d472eb531df7200fa3c1 100644 --- a/model-00023-of-000163.safetensors +++ b/model-00023-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d0175c89315c5a7420784da8b46ad83d896b6f1b019ede2e8e9137fc43c5ddff -size 4302348584 +oid sha256:9ea23f670315f74208553df9d951de49a4fb224176e3b5d7098ccfef73659a35 +size 8598786704 diff --git a/model-00024-of-000163.safetensors b/model-00024-of-000163.safetensors index 1799e8a49241129f65a4dceeca985a94e03ed497..333d497e29c270a25b9360d2ceebb4c372413cec 100644 --- a/model-00024-of-000163.safetensors +++ b/model-00024-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7aea2f0b0054e0729a4932bb2ef2f4e4d2a84575c874611bbcacebe641da78b2 -size 4302382264 +oid sha256:45b4e68f5cf91afc62d734a8d2827f15936348fadbfda810459523613df54d8b +size 8602554224 diff --git a/model-00025-of-000163.safetensors b/model-00025-of-000163.safetensors index c71df7838897d1476d4631b01e1fcc2acf88f10b..7a4fbec94d0447d70ebc6b56675f8e906fc7d94d 100644 --- a/model-00025-of-000163.safetensors +++ b/model-00025-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3c4f8ea8cfd59a26c06a4118e98f5519d25f9471c7f2dc09534ec0352cb4efcf -size 4302382720 +oid sha256:3c21a1bf73be1a304bf4335fd2b75761ea1bd6be1c27239789b984becbf316a1 +size 8602554448 diff --git a/model-00026-of-000163.safetensors b/model-00026-of-000163.safetensors index ce382f2efc28864eab0adebe62a3f437e96dbe71..3dcffb8e856290ea00a9b963e974626794b51996 100644 --- a/model-00026-of-000163.safetensors +++ b/model-00026-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:74c70c83c69c8035cce7f760b179b7ca279236ab439d672d298b8d27a92113ae -size 4302348392 +oid sha256:97f99c8f33e134f633c37a2c755d40a9b5724d293d9f02a5d91c08dbf5b6463c +size 8598786616 diff --git a/model-00027-of-000163.safetensors b/model-00027-of-000163.safetensors index 0a48a9717b2a9ada727d8dcef442fe4907564be4..077efcd10b0139a09a8ea72cd49d6b3797df9ca5 100644 --- a/model-00027-of-000163.safetensors +++ b/model-00027-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a9d5999b2943768dcc67cad1f8411d8f1e1aeb55c429e513d7789a5cad3152be -size 4302382448 +oid sha256:7bd3e6528dd202fc082942c09842ac44e5fd9d616ccec3148a43afe53f89ddbd +size 8602554312 diff --git a/model-00028-of-000163.safetensors b/model-00028-of-000163.safetensors index 0f2f5ff5965286a2253bdb70e4b4e8ee4c6b0f57..5664127d4b09a5fe7e32cf6c7ed362629f247987 100644 --- a/model-00028-of-000163.safetensors +++ b/model-00028-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3d08de67222c0b2e1d91e69dc2afaf719dcd43516a286ac9be33d3e95261892 -size 4302382720 +oid sha256:d0d206e534983d48c59e6c9889ad948062f505546aa17685dff84804a163ecf1 +size 8602554448 diff --git a/model-00029-of-000163.safetensors b/model-00029-of-000163.safetensors index f2e4132752ca6046eb9b30d3345d8b70b84805d6..e7cb469b7216b9f1462adf4e99e24916bec28fb5 100644 --- a/model-00029-of-000163.safetensors +++ b/model-00029-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7984feb281a1ce60f706eeb95e5190ca228a0217e5bd693addeb85d308e53d30 -size 4302348200 +oid sha256:26ff62561debd8c311508403dbad8288f05c21d9c949d73841a2fd8c2fa52eb4 +size 8598786520 diff --git a/model-00030-of-000163.safetensors b/model-00030-of-000163.safetensors index 88deffdc7631f63d0dbf4df4ebc0afe02a0dc3b4..33dfd4aa657aae588b5754992acd81ad32d93d4d 100644 --- a/model-00030-of-000163.safetensors +++ b/model-00030-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9ddf8f8cc2330c91beddec149d5f256bd54c1b501a0b6d205ab2afcba76de0da -size 4302382640 +oid sha256:adf9603677165b94712a40c1762e68baaf84b403a8ac6ba858d7124616492e95 +size 8602554408 diff --git a/model-00031-of-000163.safetensors b/model-00031-of-000163.safetensors index 0f8992c8dd2378804b9c6113b3f36237632e152f..3f77d7ea855d18134a0eea43e96d3ffcead22241 100644 --- a/model-00031-of-000163.safetensors +++ b/model-00031-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:72eb06264d09a343bba922c11ad90ccba018f52f4678a2d951923672ecb246a6 -size 4302348600 +oid sha256:f1259369545baf65d39e51abc2b836ba8cc94ecaf8420501c4cedc7086ed1a70 +size 8598786720 diff --git a/model-00032-of-000163.safetensors b/model-00032-of-000163.safetensors index 247ea2d6a0bd6ca9f928b1b9c83eba5e8835e887..14a3282c33c09222980cae1260805d0beccd0e00 100644 --- a/model-00032-of-000163.safetensors +++ b/model-00032-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c82bf8f9a875f472a590aa80bbaa4da17d778a41bc35b042363c7f2b4fcab80a -size 4302382248 +oid sha256:fd9e06d518b2acc79da78eacdc33a770e59000740595c4e42037fb4093ce4c97 +size 8602554208 diff --git a/model-00033-of-000163.safetensors b/model-00033-of-000163.safetensors index 02b3549df5903a4dff3e88ae56d210180d321de8..23b6e9b882f54a5e78c49cd02cc28de49dc2b62e 100644 --- a/model-00033-of-000163.safetensors +++ b/model-00033-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c95969b504e6cec53e981bf224c8051b3808b12666f5fe1b8ebce720f57cd62f -size 4302382720 +oid sha256:0097071ff088e72b2b68c27bce15c7dc00b7a3acf29d8b784c4211d5e92c3af7 +size 8602554448 diff --git a/model-00034-of-000163.safetensors b/model-00034-of-000163.safetensors index d77c2e86bb535dd97c10d620ba055f276b77b61b..0376c453fbd79887af4e731620cf85a17d353ebc 100644 --- a/model-00034-of-000163.safetensors +++ b/model-00034-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d549912fa539c15eb2d31b0c81197b09fb288458aabf8d6b1f240b5fcaf0872c -size 1747416576 +oid sha256:e945cfcf728b08964e8d222a160f2aa5ed90d3ee1b7235feb4d37c1e406482ee +size 3493899088 diff --git a/model-00035-of-000163.safetensors b/model-00035-of-000163.safetensors index d51943df9d07aa41d2ef6c7aa7da3e721e337ec7..4d8d4ac134847efeddab3e980fb24c7d4e9c66ac 100644 --- a/model-00035-of-000163.safetensors +++ b/model-00035-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:110b10ce1ac78868a426f5960d2037398995d3e23722a9d5cff2d85ac4b4463a -size 4302315568 +oid sha256:312fd1d6b0101746cb478519eb9c0d8fa9039ee8e388a28a7adb895f6d464bf9 +size 8598757608 diff --git a/model-00036-of-000163.safetensors b/model-00036-of-000163.safetensors index dde21f628719d47f6f5739e6a4cfcc6defcdaf0d..985e2480fd9ea8b302724c82f454889de21a6db8 100644 --- a/model-00036-of-000163.safetensors +++ b/model-00036-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:80dfc11f732d16b60d7e150ec6bffe84cf6373f9963383fc1da6ec1491a04b72 -size 4302382672 +oid sha256:6b4bf1884af3e2272f3485989feaa2c35764e7dc676b9828b0fe152d131d57a3 +size 8602554424 diff --git a/model-00037-of-000163.safetensors b/model-00037-of-000163.safetensors index b389f2ce44282f19658ee993042d452b310ee6e1..308cba43de14e1d0ac1dc0cdd6405a7b73e8dca9 100644 --- a/model-00037-of-000163.safetensors +++ b/model-00037-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7475424d577cdbd86225777b4ceaab9cafa74511ba55f493f7f487b9706fe88d -size 4302348568 +oid sha256:b5f16bf5d49dfede70ff32f2928ce551bdfa0886c3f4d5d16c96fc29b7f2ea9a +size 8598786704 diff --git a/model-00038-of-000163.safetensors b/model-00038-of-000163.safetensors index 42c6948e89d1ba280a3c7443f2f0522bd560b83c..dc5cfc5a2813026a8025ad9ace7127207d26acef 100644 --- a/model-00038-of-000163.safetensors +++ b/model-00038-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:83a71a848794efa1c7f97e9e7a6e6f55a9cce95add7656de0000134e5cfc704a -size 4302382280 +oid sha256:468bfb987ef42643c786d7186396bdda85f4d25645d9a31e790a0d8bb4b44c87 +size 8602554224 diff --git a/model-00039-of-000163.safetensors b/model-00039-of-000163.safetensors index 63f0e8e4e8a1d5d7a6e77434dcfdfd628edaae56..dd2141ce9af6b6311e5101006409952dd816644f 100644 --- a/model-00039-of-000163.safetensors +++ b/model-00039-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:271ec648451c8387511173eb0d83f98b514f730076ee9cad632b923e70c304be -size 4302382720 +oid sha256:5c4a9a0cac83f04222675eccee99896a97476d4cf62e67970d79610e4b9edd06 +size 8602554448 diff --git a/model-00040-of-000163.safetensors b/model-00040-of-000163.safetensors index a95dca32d47d94f52acdb784408e76351d1c1e5e..f1ecdb45f35b31a7d61c9907180f79bf58fb5cee 100644 --- a/model-00040-of-000163.safetensors +++ b/model-00040-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e547cf5d0ac39457bfcce969740b2e31b4a473279c5142a875cd3c56152d3d9e -size 4302348376 +oid sha256:a4ed30bbee0d4375654ae00a224d904182b43ef52429f673e92ccea1751499a9 +size 8598786608 diff --git a/model-00041-of-000163.safetensors b/model-00041-of-000163.safetensors index 90876a813900945a11af9e838b66824a7ecf9a22..b78c5eede247fd014c90b17afceaee6fe325bf74 100644 --- a/model-00041-of-000163.safetensors +++ b/model-00041-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bb81456fccb3593215a1417ff4bd83e6a18a5156f43266fe40968bf5680cf968 -size 4302382472 +oid sha256:7add203ee94d361212f1ed95104362fe17c3bb6def0a5f3c4dfc55d65cee1355 +size 8602554320 diff --git a/model-00042-of-000163.safetensors b/model-00042-of-000163.safetensors index 907aafeb085ac103576d2feb83941ae33f828c15..86de11240be09b54dec7241ce7cb112948a73cf2 100644 --- a/model-00042-of-000163.safetensors +++ b/model-00042-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d37f968c691f7ca717155328596eab59ffcd356d48dca5d4451f9e2e262a6056 -size 4302382720 +oid sha256:2314ac6ab0b65bbd02b6c20c17fca9701c730c3c9467f5c0a5301f185334a442 +size 8602554448 diff --git a/model-00043-of-000163.safetensors b/model-00043-of-000163.safetensors index d907b23e05d0a2d02195cb2ac7deae4cf1f656b9..6eda94fd5facb2210221622a8d6cba440ec960e6 100644 --- a/model-00043-of-000163.safetensors +++ b/model-00043-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c31b7cb0d0e6761fec2ce693b99059802b055a51cac5d7e0485d214517af4cdf -size 4302348184 +oid sha256:2806bd67ba768691218e8d8932bf6c56eaeb4290945777233fc34bbd91013a0a +size 8598786504 diff --git a/model-00044-of-000163.safetensors b/model-00044-of-000163.safetensors index 3df2d730532f991aeba7ff1a2998cdb0356ae35f..6655c92120363f70af1d0911eaf7d200b26486e3 100644 --- a/model-00044-of-000163.safetensors +++ b/model-00044-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:224b741d367e4946c1fe35429ad877e640a7697c9b86fc619c0f1b4e57e63125 -size 4302382656 +oid sha256:18f2ad4dafbe52517ceac1158a033e71c8c2f5984b047b45ef64e8aa7782bc64 +size 8602554416 diff --git a/model-00045-of-000163.safetensors b/model-00045-of-000163.safetensors index 999738ec725e08d79dc00e16c04f105d67e155e1..8e605fa1b8fb33aad80fde892070d85e728b26d5 100644 --- a/model-00045-of-000163.safetensors +++ b/model-00045-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d205fd835afec706efad9b7349b92bc098e1e21d7c4c283ec7aad45423d381c8 -size 4302348584 +oid sha256:f0f6ef12b89c5847ba4cdebd40c240dd7719fb007acb1876b7736e44b530afaf +size 8598786704 diff --git a/model-00046-of-000163.safetensors b/model-00046-of-000163.safetensors index 77af1f238a1bd47178c05d511cac8e26d577849d..6e481a32afa0e6cb2bb36a5cd5c34e0a56fd7ff8 100644 --- a/model-00046-of-000163.safetensors +++ b/model-00046-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cf167f9e7c7b2c5a91d6af1a2a4b3d837693c751045a767b7754459ae0bbb15c -size 4302382264 +oid sha256:8210ac92c6c04e166fad21c723a9d5510d1a1ee0e42cbd119e43166d5cc5e43a +size 8602554224 diff --git a/model-00047-of-000163.safetensors b/model-00047-of-000163.safetensors index 1ba92e29abf03a0368a83b76899af99c306ae6d6..8ed80d07e36674eb98e79d493079b067759a54fc 100644 --- a/model-00047-of-000163.safetensors +++ b/model-00047-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7a6aea045400e3c788f4980e51b2eb5fade7598e98f2d488b623ba9eccf9a9ed -size 4302382720 +oid sha256:63c3fc0080b7f46cae7e363732f22fcb9bd53dbe3634b015e3eeea4a6d1280c0 +size 8602554448 diff --git a/model-00048-of-000163.safetensors b/model-00048-of-000163.safetensors index 71fff10c56c64713daef0630da829eece1646b7f..bb5a3c8c5f743e4a2af3052b4f279ff8b88a96f6 100644 --- a/model-00048-of-000163.safetensors +++ b/model-00048-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:495fd0dbadbc3cc87b48470bc17d08c312668e54d731c498ae9a69b19354c4c4 -size 4302348392 +oid sha256:ed2dafb36ee2001b2c8db6f7e2f93bf3f2fb6ce61337cdb413854e8812607789 +size 8598786616 diff --git a/model-00049-of-000163.safetensors b/model-00049-of-000163.safetensors index 45d33cb30188ba5e3235fb4317ae27da21ac80d9..3a5746af40ab10d18c563800482b05681ef23ae1 100644 --- a/model-00049-of-000163.safetensors +++ b/model-00049-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:49f78faa1b3a5dd74244c87806000e8cc53a75c5d904f40a7e84eecfe0c43882 -size 4302382448 +oid sha256:109c54d8214eb6eb6046d67360913846fd0a58eed6149b69d8c339c1344e1066 +size 8602554312 diff --git a/model-00050-of-000163.safetensors b/model-00050-of-000163.safetensors index f71d1bb057af54664841cee3101b353b8b514250..ac1cbcc1b9b28db7e01958632e0193dfe5f7398c 100644 --- a/model-00050-of-000163.safetensors +++ b/model-00050-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:96def4741865d745e61ce0aa0bd0ac5596ec21b38d78772122db69f5ba2c26e6 -size 4302382720 +oid sha256:c8f3ce5dbc7d63cc56016dcd0d964454d6cd65ac65dddb20924d513656943b56 +size 8602554448 diff --git a/model-00051-of-000163.safetensors b/model-00051-of-000163.safetensors index 7d6de6121f4bce4844398d588398d51986266dde..d08035d4ef94be71f3c039f42b9b80f1928c78ca 100644 --- a/model-00051-of-000163.safetensors +++ b/model-00051-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:50fbf38ff4f43faf80a5c3960398618ee264d6397180fb67d813a56708f4607c -size 4302348200 +oid sha256:bd8b6871e712cff50196e61d729ddf1094c9b05f49ea118dd7de3e96895f7d88 +size 8598786520 diff --git a/model-00052-of-000163.safetensors b/model-00052-of-000163.safetensors index ba542dc06dbc6614c0ff972dee0032ef9600edfe..664f4d55960364d79a9463ace651789a2c1648ae 100644 --- a/model-00052-of-000163.safetensors +++ b/model-00052-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bfa6fe30fe85598e443b13da1785c4cea7e5914b3bc059e0a73bac34acfd9486 -size 4302382640 +oid sha256:ed7ad15da14828e091b3ec50570c4131ec548207b658d440b9fb19583b963d54 +size 8602554408 diff --git a/model-00053-of-000163.safetensors b/model-00053-of-000163.safetensors index cff423e218161050920e168db355da7ca7fd4281..80cd149e8987d128282bf9c5ed286f25db16c763 100644 --- a/model-00053-of-000163.safetensors +++ b/model-00053-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:76b4cb5662df06a9c923eba4505173e482a395ae481d05fbdabe038b2c4c615d -size 4302348600 +oid sha256:a5a3d58a2e6cf4a0492f0de9471acadcacfc66f0a658c713d08db5639a79e1a3 +size 8598786720 diff --git a/model-00054-of-000163.safetensors b/model-00054-of-000163.safetensors index 6b8e5c483c89627426c4c65e02942f0fd04dbcad..44c7c3b53048a3c02850a1cfb9983e4b5531c696 100644 --- a/model-00054-of-000163.safetensors +++ b/model-00054-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:287cc7664a2550e538658bfd3e8b31065b160960e4b124451c44da966bd30899 -size 4302382248 +oid sha256:9a008f7daa3f03164dbc6e408d9c525303cbb10371ab0cc9ed3bb960d4ba01be +size 8602554208 diff --git a/model-00055-of-000163.safetensors b/model-00055-of-000163.safetensors index 7e9218d1cf625da2d425c9ef7e892aa2e391ed04..0ca188fa53176e9c966e95b5d1bf73539ba6eed2 100644 --- a/model-00055-of-000163.safetensors +++ b/model-00055-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3cbc230da43f4621c5aa09cb98d45b2b0bae793c820c57e1c30d0a4b50f99899 -size 4302382720 +oid sha256:a3172f319a1712c6601a27655a40f1eeacddb2a9ae84417cea142706a8630f75 +size 8602554448 diff --git a/model-00056-of-000163.safetensors b/model-00056-of-000163.safetensors index a9b57b3ec67a5cd073005297349db652a7252c8d..1aa3f3cb8c51635d1363e3462a21c234010f9e53 100644 --- a/model-00056-of-000163.safetensors +++ b/model-00056-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5c4564fb09a95567fd0056fba325682bd280a16ab5cd556146b03e825fadd409 -size 1747416576 +oid sha256:fe8f44186c53b4405a452e71201d5900868147e9d51350da80bb2c2583923265 +size 3493899088 diff --git a/model-00057-of-000163.safetensors b/model-00057-of-000163.safetensors index 589c8748807547d6667a7e2eefeaebcc85719a5d..ec5012b9dc82a7d9bc0948e482bd5082a557e713 100644 --- a/model-00057-of-000163.safetensors +++ b/model-00057-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:42c611df18127e68b183d83d426f80c981a46a1583e6c8547b820cb2cf11f9e3 -size 4302315568 +oid sha256:212d6e1c2b6cdfe77b75f79138ebbf8bb09d4b71a8c13e64380774243f759018 +size 8598757608 diff --git a/model-00058-of-000163.safetensors b/model-00058-of-000163.safetensors index 546bb6d632309675ddcb4ea25215de19acb68ab7..d94c2fef271102ee88f851a53ff91b61c6bf075e 100644 --- a/model-00058-of-000163.safetensors +++ b/model-00058-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5c96a41c8c6214d702b42347515f9afcdb49639bd24847b89845822a0e7fc536 -size 4302382672 +oid sha256:417e7bb57ff438e24e342c8d8469dd9bf17e9149e29adc675fc1997bfebcc3d7 +size 8602554424 diff --git a/model-00059-of-000163.safetensors b/model-00059-of-000163.safetensors index 8987c1c39ddcdb27a1571edb93f57acbd4a1d134..171a75537e4906965ef26c9a492bf207e69c49bd 100644 --- a/model-00059-of-000163.safetensors +++ b/model-00059-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:82cb401b037eb3a5d1fa2ddff2f6aada163be92a5ce4263efc29ea1b0abd0dd9 -size 4302348568 +oid sha256:f37f8fcff837e750a595d0ce4651fd40ef74fd80cc9cc27a5eaea1b037a2a8ad +size 8598786704 diff --git a/model-00060-of-000163.safetensors b/model-00060-of-000163.safetensors index 7b4ef1cb62b5dea9b04d54bd13aaad197437fe90..5189a00bd417478dbc07b6b70c4af3bfb17664bf 100644 --- a/model-00060-of-000163.safetensors +++ b/model-00060-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:39c30132687d8e8d8a28962396282b8b59c41801d7f402575f7c523355d4ab8f -size 4302382280 +oid sha256:3fcb69e9b712f536bd3ea2d56744046d610a555adef78571d61cb42cdc52781c +size 8602554224 diff --git a/model-00061-of-000163.safetensors b/model-00061-of-000163.safetensors index 938e68de52680a1840f85ecf850577b43b072665..25316f5ec5de2115350d172741828dd467633740 100644 --- a/model-00061-of-000163.safetensors +++ b/model-00061-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5268560024a2acbe0c8041757da473a6f3a222649cec4466242e53fbe03d93c6 -size 4302382720 +oid sha256:b25cbbc476784e8362615664a90c58317f2a1b159e1b72800028fcc33c51fa29 +size 8602554448 diff --git a/model-00062-of-000163.safetensors b/model-00062-of-000163.safetensors index 55426295cf0beb79d893bc9b2623fcebb7d6a63c..f4eac15c8a6d58f8bc4e197db9b195a35e5ea536 100644 --- a/model-00062-of-000163.safetensors +++ b/model-00062-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6268a28d3c0acabcda03273193ec56d1c55d08e3e41cf03592571d6731d003ae -size 4302348376 +oid sha256:0750416611a3a829a07b8bab6651607d111b4ba7e1682670c50db4fc8c8f16b5 +size 8598786608 diff --git a/model-00063-of-000163.safetensors b/model-00063-of-000163.safetensors index ea499dfe341a8dd1b1a14d636f77149f33f7b479..b4b718374a0d9a4904f889b075eb0810bd480e8e 100644 --- a/model-00063-of-000163.safetensors +++ b/model-00063-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:69302874728ec3b3b23d85ed8c38453f60dc6b939e35bb0933aba81464e88d23 -size 4302382472 +oid sha256:1382521c572c1edca300dd8dee904ca04cbbfa9fbbfd0c7cb9e00bfd17c63d1f +size 8602554320 diff --git a/model-00064-of-000163.safetensors b/model-00064-of-000163.safetensors index fd9b61885b27904cfc50094454bec50d01c36ad3..0e3d0170287e1138dac60619e7131c7971451dad 100644 --- a/model-00064-of-000163.safetensors +++ b/model-00064-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c04edd05f12fc18584f03a3c54519775bc2fb7e5396aa711f31d7afb3725191a -size 4302382720 +oid sha256:4a678da1d71a9be7cd03d5ef60a053d2ea01b7bff90305af790923ed8d8f865b +size 8602554448 diff --git a/model-00065-of-000163.safetensors b/model-00065-of-000163.safetensors index 82540cbf6490916f68a3c579c8b1c322035484c8..c5e4795b0bfb202c734d7f0a36d4b38460daeb0e 100644 --- a/model-00065-of-000163.safetensors +++ b/model-00065-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:01457640fc6800a333f1abf5ec152fd9b3d4738f0265a8d9154aa93a0f97b8fa -size 4302348184 +oid sha256:51076fe0dd334c8c417ddb498f186da2a2f38a42ce443bf92e62c40173d101ea +size 8598786504 diff --git a/model-00066-of-000163.safetensors b/model-00066-of-000163.safetensors index fc6ba0a4462efd0809c980db7e45ba166696161f..7962d0d9b6a5ecdc9b939191a30ae8f96a3c449b 100644 --- a/model-00066-of-000163.safetensors +++ b/model-00066-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c21e9375cb802f161772686c446e03e6f88e4841781f625665f0023c83502593 -size 4302382656 +oid sha256:92af81cf795775272e553c5baf3295e5875a4855ba32f081dfdf45420865077b +size 8602554416 diff --git a/model-00067-of-000163.safetensors b/model-00067-of-000163.safetensors index 2d4cc774a4614313694869fcc59cb2f3d8321045..4af1588f758e65425f0aec9899dcabee66077277 100644 --- a/model-00067-of-000163.safetensors +++ b/model-00067-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:040f071e3031c9d5306e7c21d56257c1892b4a65921787f886c30b978193808a -size 4302348584 +oid sha256:df142c5ca4be6194c8f4ee9c8887bd77ef3e038bde98ce38d1637cdd310ed4bf +size 8598786704 diff --git a/model-00068-of-000163.safetensors b/model-00068-of-000163.safetensors index 08c99f8b98b29ee19ed8ccca734d932ae378196b..1cae0b6e76ecfce70930b76b3a9e46ab2ec5ddd2 100644 --- a/model-00068-of-000163.safetensors +++ b/model-00068-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fcd388b47a62ec90b772f6f0d3cb92891b8f932077afbc2d7b326fd641c23320 -size 4302382264 +oid sha256:849abcb52c32419c93a20dfaf42b0f09966469a060122fe26d594c9faaccadcd +size 8602554224 diff --git a/model-00069-of-000163.safetensors b/model-00069-of-000163.safetensors index 8e30346740346011567d0387c51f377f9bdc62bd..fa09d9c82ab45112b6cad70c478a91d234ecb549 100644 --- a/model-00069-of-000163.safetensors +++ b/model-00069-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cb2117e003cc2be38fefead98e0534403db7d6b2828fa9baad70138121f11f48 -size 4302382720 +oid sha256:0b6b493ba75da6e1d6ea920c43b6791e09bd8096606512eec607dee6780d4076 +size 8602554448 diff --git a/model-00070-of-000163.safetensors b/model-00070-of-000163.safetensors index 0e4ac6663eb1a4b5e1aec4f0facb1364ef7ed93b..2051500b0e902086c73a856c382579996587a450 100644 --- a/model-00070-of-000163.safetensors +++ b/model-00070-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ed2b3e523a8b242fc0384613d4653f4cf9101e7470ff88379754fedc5b374ad -size 4302348392 +oid sha256:d45fe924c4a9bb9d909711f104fe4244093f4aad5a7df7922212bb7550ccfc0c +size 8598786616 diff --git a/model-00071-of-000163.safetensors b/model-00071-of-000163.safetensors index f2b8815c59006735be25b0fbde9efcf21c5ded96..f0c0b06a45c0240ef6d98cd0a6f1ba62b42d1d70 100644 --- a/model-00071-of-000163.safetensors +++ b/model-00071-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e561a73587f56b7765d03a81b18085e2995338c09bd668aa64552e57037abb7d -size 4302382448 +oid sha256:e8838e64ee2930c621b3ad80fe520d3beaa0e74daa2f7078fb519cedd7fb5d5c +size 8602554312 diff --git a/model-00072-of-000163.safetensors b/model-00072-of-000163.safetensors index 2ca9664571a1beb8c4d25514cf65c28909a36cab..96bdf63c3e260a255dbe13a07027f3ab6a48073f 100644 --- a/model-00072-of-000163.safetensors +++ b/model-00072-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b5a4f861307ab5619928c3a28c1949cef43638de5a47f3fa73605c7edf996f7a -size 4302382720 +oid sha256:7a563efd8da1794d1405360d187a7d646dc3460aeedd701be4b2074306081de5 +size 8602554448 diff --git a/model-00073-of-000163.safetensors b/model-00073-of-000163.safetensors index 16f645ebb0148ba1676f38c66735e150cba37040..d2f358e90453a811d3657073a2ede114a1d43bfd 100644 --- a/model-00073-of-000163.safetensors +++ b/model-00073-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:43018b12615c92a64312cfaf0465a343e3c291f1c40bf9312cb6e4fce1e38830 -size 4302348200 +oid sha256:da584d02f210930a4d399421c9911d2225061b048740093b4960b2cedc1396f2 +size 8598786520 diff --git a/model-00074-of-000163.safetensors b/model-00074-of-000163.safetensors index 44fa3eff621f259e1800af7e35207ed8e91429d4..5d933048dd27ee5887b127bef4cfd8c86bbbf0f9 100644 --- a/model-00074-of-000163.safetensors +++ b/model-00074-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8d15bd983efe504a8d2823a64ba77d74271cf4eee02a08d0119864d24fbae104 -size 4302382640 +oid sha256:ac53993dba09882ed57b0f82a91deaf79138d6c322fce629a44866b715046cfb +size 8602554408 diff --git a/model-00075-of-000163.safetensors b/model-00075-of-000163.safetensors index 5ded5a4b62f764e169a6b9b38824b658930a9457..f241e036376fd0b9af73c7617d1b7ba87d606be9 100644 --- a/model-00075-of-000163.safetensors +++ b/model-00075-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cdbf6c697c7abe1a92d15ec825193f047d3c262492e5780942bd62df5512fdc8 -size 4302348600 +oid sha256:c1b55bece2de590bc674bd00f88c66d95043e940a783e33185d13a00862b6b79 +size 8598786720 diff --git a/model-00076-of-000163.safetensors b/model-00076-of-000163.safetensors index 135731e51942f594db9ebdf5d26fdfa23353828d..1dc03813a73e3086af49b4159daffdcd6733bf76 100644 --- a/model-00076-of-000163.safetensors +++ b/model-00076-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c3733153525cf7775f6f1ecd5c4a7285f742a74ec9d9390baf06bb0ddc28fa17 -size 4302382248 +oid sha256:5e8197740887ef2ff9ab580294af81934e11d75989f3e6b33757eff92209eb07 +size 8602554208 diff --git a/model-00077-of-000163.safetensors b/model-00077-of-000163.safetensors index 8667f169580061060f60ca33793b081b60d9ea02..5b77d4ead71392d08ad232a07ab5af6ae38c6b80 100644 --- a/model-00077-of-000163.safetensors +++ b/model-00077-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b6e13a57aac39b76373491250e104e1493e75b1cf40ac24b356d124d23c12b5b -size 4302382720 +oid sha256:d1c6cfecf66c584616768b7f35cdca96e83c4ea9d9c594259776dc8e0305fd6f +size 8602554448 diff --git a/model-00078-of-000163.safetensors b/model-00078-of-000163.safetensors index 6f747c3771af10cd40c79019fed5a931e66e719a..03352104343226628e2cd1fa8091ac094f5349b2 100644 --- a/model-00078-of-000163.safetensors +++ b/model-00078-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f4e38512e5cbb087f4afcc9c693e5cd48ee04d5d286b7e33e4e2bb00e55a8e15 -size 1747416576 +oid sha256:a292229f6be61a883bc6f16625a76eddeb2037487f51c07a5a615d1122a6b82d +size 3493899088 diff --git a/model-00079-of-000163.safetensors b/model-00079-of-000163.safetensors index 695ca22c7d1b1c6c64cab285d57dc0cd82c2dfcd..c933bdb81986a3a9bbbc4bd7867f02b5ddd1ce15 100644 --- a/model-00079-of-000163.safetensors +++ b/model-00079-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:75ef908363946d71fa98d65dec8c175a729194854de76f76c32215537994bbff -size 4302315568 +oid sha256:bd5256eb4974d778c9de98d10db16046c7d3792dd53ccc3f6914f7f6fc748359 +size 8598757608 diff --git a/model-00080-of-000163.safetensors b/model-00080-of-000163.safetensors index 9c64d98838494a00eacbed7b9e117999bf4b749b..147adff482b45275e5fa0c302549007a9e051aa9 100644 --- a/model-00080-of-000163.safetensors +++ b/model-00080-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:45f2998a098bddb43815ebf73bae709c5b5eb7239f86642422fd3576bd0b7f0a -size 4302382672 +oid sha256:20e0e2ff32ca5cd9a76d0f4dc2a72118c61d85299fff6237c3d31693121b709c +size 8602554424 diff --git a/model-00081-of-000163.safetensors b/model-00081-of-000163.safetensors index 731b7d2dcc82008f8164983bdb48840903363e70..4d52fffd141cd53b63255f63d42848445c255227 100644 --- a/model-00081-of-000163.safetensors +++ b/model-00081-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1ddbbaffdcc6dd651d68de3596fcd0ec71c688040df5a40793264e75c5c15df0 -size 4302348568 +oid sha256:b7056cc113488848e257719522c6b11affc7a1dc57a12ee337ea52757802fdc7 +size 8598786704 diff --git a/model-00082-of-000163.safetensors b/model-00082-of-000163.safetensors index 9b8d114062563b1cb3ca50c09f26f5da35df7132..306c43a6d4784b84ea41edcb1371d6f723047f1d 100644 --- a/model-00082-of-000163.safetensors +++ b/model-00082-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8661446c066e89475a207aed7c58bef16948fe0ea3a832c486a69ec12325f8fc -size 4302382280 +oid sha256:0371764244ab5f9e51324dcb7a0bed6fb83233c546199a04c17cccfd0e1f4210 +size 8602554224 diff --git a/model-00083-of-000163.safetensors b/model-00083-of-000163.safetensors index a7a054741d5a705c283c05632dd1170a58440d29..299046a0c8a90158e6bbb1939f410cc93a8a83c9 100644 --- a/model-00083-of-000163.safetensors +++ b/model-00083-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c25a777958d3a868ab6b57b6e5d2d9e040a0fa95d8a67c095a21e03a7e1a04b4 -size 4302382720 +oid sha256:f09aad4a78038d6023d3569e80971f9de4846912490b50926e72535af9fbb6c6 +size 8602554448 diff --git a/model-00084-of-000163.safetensors b/model-00084-of-000163.safetensors index edc1696ea2f40c29d5d000e7eaaf5303237de79b..110dacc34d34be73e76dc11f4fba750b158430e0 100644 --- a/model-00084-of-000163.safetensors +++ b/model-00084-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0df8afe9fc329bd69bd0f0349240fe622c8f2de176e680699894e36f0f21c78f -size 4302348376 +oid sha256:78db766bf512e44f7d892a116b5796e0c9cd4fdc03edc106603e12071e4498c0 +size 8598786608 diff --git a/model-00085-of-000163.safetensors b/model-00085-of-000163.safetensors index 9b3b3d34d11ad826426c781ca506cb4b862e90dc..f8b24fc7d377beac7000f397c4e669ba874c5520 100644 --- a/model-00085-of-000163.safetensors +++ b/model-00085-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eb324543ae75744d8d3d6a7e247f0aacd053f78cc6addb16a81201e838b70911 -size 4302382472 +oid sha256:3719450991118be3bcd23753f5b385c13fe2e59fc5c67bfa55550416164dfb11 +size 8602554320 diff --git a/model-00086-of-000163.safetensors b/model-00086-of-000163.safetensors index 917196001e5b82ac0e0d2f78f5e287647cf73440..3707749425010079278bd36a51eefb26e2e3da51 100644 --- a/model-00086-of-000163.safetensors +++ b/model-00086-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2f63d1bb77a82c1f0c2f84f2fdb5c5a81ee8eead300feeb333c3bb52f2f007c9 -size 4302382720 +oid sha256:b29320f02420317323292067d8df53c1f535fcf7c2dc3a62a7e45b95aaaf4f6f +size 8602554448 diff --git a/model-00087-of-000163.safetensors b/model-00087-of-000163.safetensors index b1dc14d81de6af8506a9798ee72ee254c05ab565..c5056099b45204e3682bcd9f854e6e346d56f861 100644 --- a/model-00087-of-000163.safetensors +++ b/model-00087-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7aa71e0c5bfe74f86b67a3adc774acc5fa7e176212424057324cb67b5235da5f -size 4302348184 +oid sha256:34b422dd91b4fa6c7983fcec5e438e3c39a47e0c2e43b4a7f1c085b2509279f6 +size 8598786504 diff --git a/model-00088-of-000163.safetensors b/model-00088-of-000163.safetensors index be4b0654d95d66ac5629410bdc39e2aa0236133e..0b79d87b1d1bc6bfca8aea003de252cf6d8f35e3 100644 --- a/model-00088-of-000163.safetensors +++ b/model-00088-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5740f8e77b3f86fd8c686d5eda884eea8c637a1a4937046f44f988a27543041e -size 4302382656 +oid sha256:d6ae316dd4e289a8b3d0d945b39ed9a06ea3d68dab84dc777abc71bc46b454b5 +size 8602554416 diff --git a/model-00089-of-000163.safetensors b/model-00089-of-000163.safetensors index 603d8369eef75427a2e343e197455ab6981cb58f..1435edf2ed7114910e442328ebe365ad8df8ca75 100644 --- a/model-00089-of-000163.safetensors +++ b/model-00089-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3137b2b82b3d50c80e48e187e6c743d735124bd55a9ecf2b6c5a4f008a9f73a1 -size 4302348584 +oid sha256:85efe31d45c70d1b4bf42f7e34a6b511116303e0586d1a6c3fdbf325dd2645b6 +size 8598786704 diff --git a/model-00090-of-000163.safetensors b/model-00090-of-000163.safetensors index 8cc2572d695a50dab7779377903af1e201289193..ac431f9e42c0c7a1fc07f32362cc50eb8f2a6b49 100644 --- a/model-00090-of-000163.safetensors +++ b/model-00090-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5e7368bc72f3f331d5bb6ab9ca023b42a4423eb21266e21e8d30f1cd70b9cd4f -size 4302382264 +oid sha256:88d82f051736f58a4055cfd2af5c4e9f7c778c95dad747412b550f9c13a312a6 +size 8602554224 diff --git a/model-00091-of-000163.safetensors b/model-00091-of-000163.safetensors index 35f26142a53dee3454ae30fb53ce3ebf718a0b59..3fc47d406081c05b87027b5fb1ecb4d4dc2fe077 100644 --- a/model-00091-of-000163.safetensors +++ b/model-00091-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:951ccb0d80fdd09fc98bbc628173df2c4854cc9be0b18efff224f8012b9a1e3e -size 4302382720 +oid sha256:86dc2465d15200655572f1f91bbba278b60044fdea5a90bd39a0bd1f48913437 +size 8602554448 diff --git a/model-00092-of-000163.safetensors b/model-00092-of-000163.safetensors index c32112e208499399da1dae7ef2c99eac9d0e9d18..96a3db24f3689eb60d93f7ceb758cb4b7b78bd39 100644 --- a/model-00092-of-000163.safetensors +++ b/model-00092-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c512f6f8a69f4528f503841f9982d39c044a5bd077939505e5b763de435502f9 -size 4302348392 +oid sha256:b93b98611a27d2854a283ec25e46802d0d0b48ead24f41db1c06bfc2a1b8f232 +size 8598786616 diff --git a/model-00093-of-000163.safetensors b/model-00093-of-000163.safetensors index b668f2c99cdf5f0f37da20a1be6207f0f54c89bd..f2f63b7790f2e9ed8b582317a86ff81a160a01af 100644 --- a/model-00093-of-000163.safetensors +++ b/model-00093-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d0ad747c864cf1d82eab114117302c23b891a605b062c43e86838a75bd38ef0a -size 4302382448 +oid sha256:06441c0fcb7ffacb6608cbd3e1be314db24020611fc9969cdcf05808181fa5f7 +size 8602554312 diff --git a/model-00094-of-000163.safetensors b/model-00094-of-000163.safetensors index e20b405db99b6f5d355a34e4c19044aaec7ed5b5..b6b4cb4126391bdc4f8b959ea229db968d029298 100644 --- a/model-00094-of-000163.safetensors +++ b/model-00094-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d3bfb9aef946581c145c358c416e687a4271c49848daa7edae10ddd1575b325a -size 4302382720 +oid sha256:59f0dd74dcf0c6eb897087ce7642b73ed57cfa6ffc24d24e484d4cdac0a669db +size 8602554448 diff --git a/model-00095-of-000163.safetensors b/model-00095-of-000163.safetensors index 3a1f4bf2e1662fd67dcc877f63987ad696dfc847..9dbc94dc4a999484503245762d896daea30dfae0 100644 --- a/model-00095-of-000163.safetensors +++ b/model-00095-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:67881b7e5de4ae4be4845c4237ef7e90f89deaca9d7796ac708f6bc5bec9ee73 -size 4302348200 +oid sha256:922e7c98dbb425546920c5c40cedd4bb5a4f0371093e00965555529fced57bc3 +size 8598786520 diff --git a/model-00096-of-000163.safetensors b/model-00096-of-000163.safetensors index 536e20e88df0f2eeb8c8c33f63995ec3a018546a..777ce308b727458de6e3b2267f2bb4048231d935 100644 --- a/model-00096-of-000163.safetensors +++ b/model-00096-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5951c6ff635b0b2b1f4a3bce3158f71ce16b27f51a6e75f2b91296deacb52b9c -size 4302382640 +oid sha256:449c70fabee9140e5f83fae1e26127ad2d8dc30b99d4dd255909c647e4cf183d +size 8602554408 diff --git a/model-00097-of-000163.safetensors b/model-00097-of-000163.safetensors index d9d1a283c8222bb957d483370ec2a26b97070ec9..917f0669bb9d43598646639b8c25ba7c7db8dc6e 100644 --- a/model-00097-of-000163.safetensors +++ b/model-00097-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5fc216781cda6a6d1084745dd016955db9ccc1ffcd1a04ed0d8863cd79f97346 -size 4302348600 +oid sha256:6b4bd62f0299b05d306cbf2a7e8461bc8e1c855362e5b798a53474eeef0f9ba5 +size 8598786720 diff --git a/model-00098-of-000163.safetensors b/model-00098-of-000163.safetensors index 239990ec64e185d99e7d879981b3b6f252259035..20b990af67495d9a5ecae456f7ff79da5185363f 100644 --- a/model-00098-of-000163.safetensors +++ b/model-00098-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ae96e2d119a9bbe62f01f6361b7391a64b6ddede99d1f38c2cb7c47fced17fcc -size 4302382248 +oid sha256:ac399b041d8461d47697aaa4d248acfcd9d404ecd3f3ef0bcc4e45a54cf59d4f +size 8602554208 diff --git a/model-00099-of-000163.safetensors b/model-00099-of-000163.safetensors index c7fa17410b88527c6b96b0a66b8ab8f9fe335b97..e1e69fd7397b7064c7666f47d24339f97b309ef2 100644 --- a/model-00099-of-000163.safetensors +++ b/model-00099-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:57981f8c985177041dab61e39a2d3713904c2c39facd7c84374d068def378754 -size 4302382720 +oid sha256:90c5fac08d2518e996c0c80602affb3a489e691991291469658d4e4979887965 +size 8602554448 diff --git a/model-00100-of-000163.safetensors b/model-00100-of-000163.safetensors index f8621bc723083dd0ae9f83ee6bc61e7683abf9bc..d6d257bcbb4108b1efc5888acec92324f7a55d5b 100644 --- a/model-00100-of-000163.safetensors +++ b/model-00100-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2956dd556a996f6298a4ea79c797aa88ce50bf46826da47bd4d319f2833c8075 -size 1747416576 +oid sha256:821dd678fb7b2c0d561903b216e0c346a1c6f53fa3ba0932e54bdd9662ea439a +size 3493899088 diff --git a/model-00101-of-000163.safetensors b/model-00101-of-000163.safetensors index 4d3bd854ae128a434a3a554f56db2f5a3a9e5350..35d245842f70a4a64b0837048073b450e1a4b9ee 100644 --- a/model-00101-of-000163.safetensors +++ b/model-00101-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c13b0ed6c756b9f95a1fa5d516d51e57b828ff7aa1837b37be010194ee9d4287 -size 4302315568 +oid sha256:328b1bd4bb4f33a2676a7f324c50fa17bcdba1e192dda42ac7dd0379a0324243 +size 8598757608 diff --git a/model-00102-of-000163.safetensors b/model-00102-of-000163.safetensors index 8d1e53b06fbeed15c2e1c97c86f2b0c07b2b66fd..9d5afba4ed5955d52568d2dc7e44adfec7e702e7 100644 --- a/model-00102-of-000163.safetensors +++ b/model-00102-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ea754e8fb9bbfbae5c71e69cb674ba95ad5c6140338d17e656150939c83050cb -size 4302382672 +oid sha256:c790c74327611d69e224a93be86900307cbae315ebd1135cf76374967e1df683 +size 8602554424 diff --git a/model-00103-of-000163.safetensors b/model-00103-of-000163.safetensors index f6c4232cb3b013f1b41b47b322da00f9b27fdfa7..52f995991fc9dfdd30ef0931587117ca2e9d6fa2 100644 --- a/model-00103-of-000163.safetensors +++ b/model-00103-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8d8c6615a04426aa634d675ed5b3168cbab344464148c7c59978b0cf5ad8405e -size 4302348568 +oid sha256:f294323ca5e0dc2a3997a9b5e38ba467e7c45cbb624815ddd56da250edad0f2f +size 8598786704 diff --git a/model-00104-of-000163.safetensors b/model-00104-of-000163.safetensors index 1e8a1165b3cd65be08598420d6915ccc9180af7c..9b2d9f78e150da639d18106b5262a16b26fe183e 100644 --- a/model-00104-of-000163.safetensors +++ b/model-00104-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b8f914bec9b872a5a624d5a0a4d35e75146f186706fcae63f35c9666794ae066 -size 4302382280 +oid sha256:9bf65633a1784acd465cbd85b323cc661babb7ae8f2c7aaf0396b2081637ef32 +size 8602554224 diff --git a/model-00105-of-000163.safetensors b/model-00105-of-000163.safetensors index dd013c4737ce533cdf55e556c5ea5d37a843306c..a6c33bf7417f0c05b763888021cb8f631505ce0d 100644 --- a/model-00105-of-000163.safetensors +++ b/model-00105-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fbbcd10373f9a2dfc33a650a117cf000e7117fa863bbf0835d57ca47ef1c8770 -size 4302382720 +oid sha256:5fde3e634c236fe019dfc7d642f9ec48374d9f64a99fe3fd7798ff0d3ecc4545 +size 8602554448 diff --git a/model-00106-of-000163.safetensors b/model-00106-of-000163.safetensors index e635c4a93ccb6911769837f86fd60b9b3b15745b..052cfc55149d79860a922e2593b131199c3e3853 100644 --- a/model-00106-of-000163.safetensors +++ b/model-00106-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f94500ade500405063e6efc299ef1356eb8e814aba23b1ffc8e520a7a65a28d4 -size 4302348376 +oid sha256:6df147482fddf2aa81689ec4c4cc71f56ec316c48e5876489f1c1d75dbaffb12 +size 8598786608 diff --git a/model-00107-of-000163.safetensors b/model-00107-of-000163.safetensors index 60bb10339c314270464127614d22f6b7b44b9cbf..ad181e1904bb753b08913424df841b85b3b6044e 100644 --- a/model-00107-of-000163.safetensors +++ b/model-00107-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f9acd49a549e874ae346c940dc939144670da931d6f3d3ca69f1de7ae588399d -size 4302382472 +oid sha256:0616f9293332edaaa0a1da3bedfef4357b02ca81847cd098295fbc3bc97b9b3c +size 8602554320 diff --git a/model-00108-of-000163.safetensors b/model-00108-of-000163.safetensors index f64790a9bac40777b990fef8e2ec56538632d1a1..82b2b98c0dbbb4b2a1377bedc939c3e6a6e21391 100644 --- a/model-00108-of-000163.safetensors +++ b/model-00108-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f5378084e6769b6a496be211d5808858149956aca7893d5e928c2772f5f9e476 -size 4302382720 +oid sha256:c3bd711282cb21c8f6203d687452c7ad35989dfe8f4a4a3fc025aea4f69fb654 +size 8602554448 diff --git a/model-00109-of-000163.safetensors b/model-00109-of-000163.safetensors index 6dab80cd64f679840a6c41c56d84886cdf613026..1e5c7e574a9c4cbd5da08d667f9bd485b87fc9dc 100644 --- a/model-00109-of-000163.safetensors +++ b/model-00109-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:820b730ab4882f28492381fd40c0591ac68e276e69450d5e3ed553496dc2a349 -size 4302348184 +oid sha256:69b6f533e0cb63a295cb67fc0304c91943d0d56726f50653428065865fba8785 +size 8598786504 diff --git a/model-00110-of-000163.safetensors b/model-00110-of-000163.safetensors index f48d70fbf2b85e70420488f48ef87f53ac610c80..c4e4c5f43a954078e159f291faf157c226a3a803 100644 --- a/model-00110-of-000163.safetensors +++ b/model-00110-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e37571416f241afcc413442a11ce8896a1ee63aab13b065227c0a04099cb2c15 -size 4302382656 +oid sha256:40dc07bd5944ca471c3307a359cdefa61a75b6905a1194083971fecc53e33bc2 +size 8602554416 diff --git a/model-00111-of-000163.safetensors b/model-00111-of-000163.safetensors index b3ebb2ca5861863b8538399cac2ce98becb5b53e..139e59bea553ea217bee376abe6038f1f6de81c7 100644 --- a/model-00111-of-000163.safetensors +++ b/model-00111-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:605b39268636cae3bb925ef22c34c720840bc6b4ee33366fc5c98e8d8d4a5d83 -size 4302348584 +oid sha256:bfb8e779b3dc2247bf62d771efa696cd6605c19f2b4d77941284e6878550af93 +size 8598786704 diff --git a/model-00112-of-000163.safetensors b/model-00112-of-000163.safetensors index e0c4b99943d4d094266dddbff86ed0c437575b70..d72b2501b0863fa8b444fb57d33b52b9518bc223 100644 --- a/model-00112-of-000163.safetensors +++ b/model-00112-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b7152fa20f96fa500166c52abdebdfd00c19871d81f235166522d5169e7263ce -size 4302382264 +oid sha256:cced230207cf140428c3a727104fe17c848c98fa25572107b271c009051f29b1 +size 8602554224 diff --git a/model-00113-of-000163.safetensors b/model-00113-of-000163.safetensors index ef6c3a001f24d7396865852c8afc580b45c5891b..4dd48d7343394607482553b08e493797502233d0 100644 --- a/model-00113-of-000163.safetensors +++ b/model-00113-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6ea651e865707be3259305153f4e7a06c6f4c6b4d9989bb6b97f92039d7714d0 -size 4302382720 +oid sha256:04828d610521659cd5e40ab32847006bb683d22b78bc4494f01485c9ee0b407f +size 8602554448 diff --git a/model-00114-of-000163.safetensors b/model-00114-of-000163.safetensors index 08d318f242ddd2eb8324fada733e51ee7d2e0a73..eaa9bb7df455054ef9dd0f964c415d6594efd91e 100644 --- a/model-00114-of-000163.safetensors +++ b/model-00114-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c2221d4f48f6deb7c16eab8d7d846ba961c3f74612a9aaf82f4d4e711a156d8c -size 4302348392 +oid sha256:e8d7dbb0c393f8507d449aa78f068f23e23f6bd60be8fe1571f79dff2c3a7e43 +size 8598786616 diff --git a/model-00115-of-000163.safetensors b/model-00115-of-000163.safetensors index d8b4c1f2682a0dc8f2db28b9803d5b5d6dfd749b..541aa4501c6bb14ba332afabc7974bf78da7092b 100644 --- a/model-00115-of-000163.safetensors +++ b/model-00115-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:35f808fc0eb23a376220e074d4463ade7f685eb174a528aac37f56b90a9c241f -size 4302382448 +oid sha256:fe1cc8703dfecac06eedb8fa61adddc51a2faf1a048b3455d7761c30def56511 +size 8602554312 diff --git a/model-00116-of-000163.safetensors b/model-00116-of-000163.safetensors index d6692ca36e2206d602adc33b010a709700552250..accea23d1e37a25fb2936888b37e067fb46f76bf 100644 --- a/model-00116-of-000163.safetensors +++ b/model-00116-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ef8f050ca1cc24dca24f789af6e9c81cb7da3e33163a9dd753bf9ac983799387 -size 4302382720 +oid sha256:3ef52e3b965c05c2f2230f328801c5337f5233b7aa6767e880cee8b2e0afac3b +size 8602554448 diff --git a/model-00117-of-000163.safetensors b/model-00117-of-000163.safetensors index c6743ec75cf2b338450ff2a276dcae0d214f50cd..268587157fe5973acd1ccc92f9885ebdea9520cb 100644 --- a/model-00117-of-000163.safetensors +++ b/model-00117-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:47126bd746d813da5b51f3584ea8e4d87b0bd7fc20c2028ae4187cf9b2d326e0 -size 4302348200 +oid sha256:376a2971ff7639b31120975647f0f9e47b07e8daa317a08a37ae80c73769d031 +size 8598786520 diff --git a/model-00118-of-000163.safetensors b/model-00118-of-000163.safetensors index 1c7f69d8591bae7196b9315dd6cd9029a3bca74f..2af2c0845162a8310734c9f9ca786fe3a2d7375b 100644 --- a/model-00118-of-000163.safetensors +++ b/model-00118-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d94096a4d4ba7efa1c31a630d9e4cb280dbe8d5574c2f9daa9cb845158a6d5d3 -size 4302382640 +oid sha256:2907aa65bb36a8526a4bb5157e0618442eb28a03385d1a31a66bf4b71678507d +size 8602554408 diff --git a/model-00119-of-000163.safetensors b/model-00119-of-000163.safetensors index 3a3c680164c1c0811e9606e6fe26ec098ed36f37..32c9efe3838161cdde53db1e9c7a736e8cff60d2 100644 --- a/model-00119-of-000163.safetensors +++ b/model-00119-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:94d7b0e6a2393122e0cf50556d05ed050b2016f71cf09a8265c89361feff9e9b -size 4302348600 +oid sha256:1476cb4c51afc7df98781f53790b629d3583953d95abfef56b477dd79066294d +size 8598786720 diff --git a/model-00120-of-000163.safetensors b/model-00120-of-000163.safetensors index aa75c596f763e9535d142624fbd205119e95cfbb..30bc196ef61d46e821810c4479cf67dfe7efa077 100644 --- a/model-00120-of-000163.safetensors +++ b/model-00120-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6620c4a6a5c7be243d4600d93ebbc163f4fdc67637df0f13363f8ed79912e43f -size 4302382248 +oid sha256:8b51267c70efa58152ab3da730b734854a373a955a7768fa9444f4808d92769f +size 8602554208 diff --git a/model-00121-of-000163.safetensors b/model-00121-of-000163.safetensors index 1ff76c813c27809ce15090e2834d50732a1b2f48..bab196503bc8cd83656bc5f9a89ba6c530b41f88 100644 --- a/model-00121-of-000163.safetensors +++ b/model-00121-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8d4878de8f54e53ebdc2e29ad7c2eac11db177ce4724dffdbf5be53062104230 -size 4302382720 +oid sha256:aad1d354dd247f7f0baff137d70afdfbe4d069d2b4a5d7317ad3c98b987dfb79 +size 8602554448 diff --git a/model-00122-of-000163.safetensors b/model-00122-of-000163.safetensors index e260c4d8ee8479b3451b4c000272bc331e0445d0..9a4061bce64ac71b94a371a7cb1ea53abe6154c4 100644 --- a/model-00122-of-000163.safetensors +++ b/model-00122-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c0f97f007f4a139c57af832306eb89a05be684c6f56dde1c8dee34e4dcc18a2b -size 1747416576 +oid sha256:d21ed70a9bd4a6811d07584459f28d46e1033e33c9f3d5d18b77610ae27b5bb6 +size 3493899088 diff --git a/model-00123-of-000163.safetensors b/model-00123-of-000163.safetensors index b324982c4bf7ed96c00e31c2640b958dd4e3d655..1d8d3a35666dcffedfc0aa1da1f6ad3e2387ca80 100644 --- a/model-00123-of-000163.safetensors +++ b/model-00123-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:519568466224076a0751d3bfe99f1e1c2e63b063df7042412777f74bb78fc6e5 -size 4302315568 +oid sha256:0abb8612dc42cc636750b017d67c6116f790a84230857902726ede5212a1a6a7 +size 8598757608 diff --git a/model-00124-of-000163.safetensors b/model-00124-of-000163.safetensors index 29a29a9668b9f4763ce3514ba3ac57f47f8501a4..2522cedf5e76b3ba01c58cb371f5c8c0cc82aa1e 100644 --- a/model-00124-of-000163.safetensors +++ b/model-00124-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:30cda78d30565747d735ba85dec5c44dcd8dc5432f26b4aed24a05ca87eee33e -size 4302382672 +oid sha256:1d860d98c956fd6ac2f95a01a3e4542d3e182551088b39ac37d46ee4e0937051 +size 8602554424 diff --git a/model-00125-of-000163.safetensors b/model-00125-of-000163.safetensors index e79ea2a8b2262a7d86cff20249dd2b2c91a1dd65..b2a9adef14233f058ccf94efd488ec9f76bec7fc 100644 --- a/model-00125-of-000163.safetensors +++ b/model-00125-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a4a0dd8ee862041575bd6747e29a31decc36ee61e06286ee9fde205009391bd1 -size 4302348568 +oid sha256:ef1ff711a31663db46cab3a33ae3451639a5f8b370d2f03a1a0ea0f367adb51f +size 8598786704 diff --git a/model-00126-of-000163.safetensors b/model-00126-of-000163.safetensors index 30352b9e3c1ee1e203df7e57bc3a2982e8e5341a..01d0e31731e6da64289c4bd465675ce4061b0a64 100644 --- a/model-00126-of-000163.safetensors +++ b/model-00126-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2123b22cd5f9deca6155053114f874e45d74033f66b0e98878d91abaec10526f -size 4302382280 +oid sha256:e7892f983d5be58c82e2a2621e73590847cabea624748a6c60f33e048040bcce +size 8602554224 diff --git a/model-00127-of-000163.safetensors b/model-00127-of-000163.safetensors index d7010ec1164a1ffd867eebf39dd4445e7cf2e055..aafd90064efae1e34f8edf5473304fda67ed1b48 100644 --- a/model-00127-of-000163.safetensors +++ b/model-00127-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df64488c1d23700c9de4a5f4dcc77d92347ff48cd5379583ec7173c462972520 -size 4302382720 +oid sha256:5abac35c5e1232546ee08478bf65018093927fbbc5de6be0b00b0d106aad48a5 +size 8602554448 diff --git a/model-00128-of-000163.safetensors b/model-00128-of-000163.safetensors index 26294f82ccdce21ff75e51bc107c3f6bfc79c789..9fc72d4e5a5dcd44c613c25d76110ca749734cf4 100644 --- a/model-00128-of-000163.safetensors +++ b/model-00128-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5372412e1020edabe1884ef7f772a3edde7a3c102530f09c3e43c86a12be8433 -size 4302348376 +oid sha256:0be9eed644d26e4c108fb4e8c9c848c060630efbb68d1a6823e93b37d2a8b6f5 +size 8598786608 diff --git a/model-00129-of-000163.safetensors b/model-00129-of-000163.safetensors index 61f354ca73617d7ab10a6a562cfa1e5738bf02b2..2cbe0b56440ec1b2ff78c7c375e56a7a5fd40298 100644 --- a/model-00129-of-000163.safetensors +++ b/model-00129-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f6a381cea2a757cb1ac454ccb21ea19debb83f2681738508d59478cb2bd10ca4 -size 4302382472 +oid sha256:2005d56911e11ec22222d439175840320793fd490baea742f6c1d0d7e769f894 +size 8602554320 diff --git a/model-00130-of-000163.safetensors b/model-00130-of-000163.safetensors index f300490a5386e940d685d5bc1f3a0e0248b6519a..53e541280d005d025f4c822ed9639a16faeca215 100644 --- a/model-00130-of-000163.safetensors +++ b/model-00130-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fa83d556fc8f63fb22bff1400c8c490f14b9085031104451f8ef456ef67a0711 -size 4302382720 +oid sha256:649d2d42c3253f704b37b4bb51ed2e785fe13c0845329cf67cc8e36f94ec44d3 +size 8602554448 diff --git a/model-00131-of-000163.safetensors b/model-00131-of-000163.safetensors index 1515ca0784dd36dcc872bd725079619f69fea5d6..df996c503a5c373f62454dfdcb8dc35e85965849 100644 --- a/model-00131-of-000163.safetensors +++ b/model-00131-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4a6476938cd6a1e8aadd044cb2883eb52d77ec58003e28b8d50e991fa64ed7a7 -size 4302348184 +oid sha256:de93f17a292f43af0b13070207a90dd769569aa3d29cade912a4390f5b42b1fa +size 8598786504 diff --git a/model-00132-of-000163.safetensors b/model-00132-of-000163.safetensors index 2cfaef19aa8b05234332aa43ade46c4da1882454..cad6a93cc9a33739438e48e0e56b10957d5db1e0 100644 --- a/model-00132-of-000163.safetensors +++ b/model-00132-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:db70f130f3242dd89ec63e69749e7f482a11c2e664e4eef6d934b0eb1347cd7c -size 4302382656 +oid sha256:67f44771bab5093ae5215a6651b0a01f83bb17106db262ab8de783c19903f7cc +size 8602554416 diff --git a/model-00133-of-000163.safetensors b/model-00133-of-000163.safetensors index b7a42de249dff81dd95f3da0da9ff90c99d3d145..59da440fd1a057829d2b1f75257b65ccbdec419c 100644 --- a/model-00133-of-000163.safetensors +++ b/model-00133-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8f488efd2ab0864520342e8da6696b711a2fc67440e5093c9cb6856b0e24a1f0 -size 4302348584 +oid sha256:b0c876d4bad0f23f5bd60734d456be64449ae737b7800e636b86682cb6013477 +size 8598786704 diff --git a/model-00134-of-000163.safetensors b/model-00134-of-000163.safetensors index 7bcd32c948cc48e41cf78c38b11bc672af783052..d83a940c3ff2e681a165e21982f1d1d92e5de3ce 100644 --- a/model-00134-of-000163.safetensors +++ b/model-00134-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b84de51ceef24cccdeb7e2090f88336ffa7b0846bd8ed0430185659d73617340 -size 4302382264 +oid sha256:de389ddcad2bbbf926628caa2b0fa4570a4d35b0dfd38638dbad756e08ceb25c +size 8602554224 diff --git a/model-00135-of-000163.safetensors b/model-00135-of-000163.safetensors index 068f8efb00907c82b16d8d032aa1b33411caff5b..296939a33ea235cbaeea75696795c88b1a27d9d7 100644 --- a/model-00135-of-000163.safetensors +++ b/model-00135-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:773db07c6a7b6669302ca6530224bf68247fa18e31d4117a7fd1f0c8d0de9963 -size 4302382720 +oid sha256:83045f32f8d06ac79dba3abe75afcdbb468cfb392764ad6f6d723247d453ad1e +size 8602554448 diff --git a/model-00136-of-000163.safetensors b/model-00136-of-000163.safetensors index 07e9a65605fab3878902ab18e40932415e874d30..2d824f6fae35001d9840c665adf27a3fe0163c43 100644 --- a/model-00136-of-000163.safetensors +++ b/model-00136-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0f072a261cb918526a8f79784b13292ce1850c3b4d6f074d557ff3098eae3868 -size 4302348392 +oid sha256:0498fe2c376b9b1b746e6c6e60df3db2677c75ea0161218c60eecedce2ecd069 +size 8598786616 diff --git a/model-00137-of-000163.safetensors b/model-00137-of-000163.safetensors index 1dc2c867158e165f85cd7c9ac5598a70d8b3c6ac..fe77f8c2b43b7d82516f4df1d824fe44a2fe652b 100644 --- a/model-00137-of-000163.safetensors +++ b/model-00137-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:093dda754c5b056acfd223460e1ef15077bba26a9b1a0ba3b924b44657cec54f -size 4302382448 +oid sha256:7180de2c7dfe8ac1db0012cbec1aeec96baeafda491ba2388c9ea5ae49e61da5 +size 8602554312 diff --git a/model-00138-of-000163.safetensors b/model-00138-of-000163.safetensors index c2ed469d266a5186eba083d3e63abc0852d7b0a5..8c6b46a8d21e11c361dddb42941c62186f0fe94f 100644 --- a/model-00138-of-000163.safetensors +++ b/model-00138-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:953f2e7288fb9e066405febc443bdd8569c98158e8d53c8e1052fa5a98dc85a4 -size 4302382720 +oid sha256:212640899a662a3d1fced8c6d41328af9774c81001e762afba5c72d009f1020f +size 8602554448 diff --git a/model-00139-of-000163.safetensors b/model-00139-of-000163.safetensors index 0e339c900afcf43429c9c326f2402aee09c64c92..969f3120c0d0f275348c36d644094d7202772f7f 100644 --- a/model-00139-of-000163.safetensors +++ b/model-00139-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2e31e57b430a8fad1b3667e2fac6aa8848ce3a93546a6847d2669e7803dce983 -size 4302348200 +oid sha256:0ee9b95c0e238b94d8f98c16fdf819aab5326db5a1b5f65b189877219a1b55de +size 8598786520 diff --git a/model-00140-of-000163.safetensors b/model-00140-of-000163.safetensors index f29310959daea0159ccbe1c551fb1c8e7fb62ebd..b34239264777a42788b2792b7a719badc9b67baf 100644 --- a/model-00140-of-000163.safetensors +++ b/model-00140-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d997785e4e236de3b974cc05ca8ce20df1058fed18673e07f85d8951ab45665e -size 4302382640 +oid sha256:226a05ff2be2323243129df09466966cb506836e554f4719d34189387cd009e9 +size 8602554408 diff --git a/model-00141-of-000163.safetensors b/model-00141-of-000163.safetensors index 7f6e528af30deed123e69136e63d685258f025b5..af55af19647ef5b95e841b81ae54cc35d01d20ca 100644 --- a/model-00141-of-000163.safetensors +++ b/model-00141-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:042bdc8970e9f676dde09ea749b866ed9177a91aa5ef1c4e4e903df790c04c83 -size 3142387136 +oid sha256:e1f66a518e1e19c72b38e00fab8cf8585f53fbef96ec4c34b55f93aac3fe7cea +size 6283123256 diff --git a/model-00142-of-000163.safetensors b/model-00142-of-000163.safetensors index 64b8c405cfa283cf44cf28e911f6a5561b186b49..7d4d1495151f0ddf072b131b950bedd2714d2aa1 100644 --- a/model-00142-of-000163.safetensors +++ b/model-00142-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d7e35992a6c4e6cfd6f130b17555b645d75cb407abe3e9bae275f5fc7e5de6d8 -size 4302315568 +oid sha256:d3fa961f2caf9289feeab0b3cbf280bcefa6efbc617b8e2929ffb59064cb454e +size 8598757608 diff --git a/model-00143-of-000163.safetensors b/model-00143-of-000163.safetensors index 01c9437a9196d12ef2d3f86899e29a2975e3143c..155dc6cf3fa7fa8a87fe28eff423068f553cc283 100644 --- a/model-00143-of-000163.safetensors +++ b/model-00143-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:10430ece1d6541fead15e9a993ccd0c533180b2c2bfe44f95f4c38b84fcbca53 -size 4302382672 +oid sha256:0da75549dd28840074d537c28d2285a125db9fb70f74bffc2713e3d57b4d4416 +size 8602554424 diff --git a/model-00144-of-000163.safetensors b/model-00144-of-000163.safetensors index 59bc0847cd3de35555da9c4bb75b6cdc16702cbf..44d9aeb55955781c4974e073e5af2eff8867d73e 100644 --- a/model-00144-of-000163.safetensors +++ b/model-00144-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9e1d10df8855972ca9c778f59a13389ffe22b617b80b443859aa232cd2bed0be -size 4302348568 +oid sha256:1f470510c127158f70b40d99fe9efe58f2d923c4e771feec052c345c68e5e98c +size 8598786704 diff --git a/model-00145-of-000163.safetensors b/model-00145-of-000163.safetensors index 013bf32dcfa26d2c044681cadf427e1b9eb1bba3..fedccd8af40c6b7126d517f413bdbf733d4a23be 100644 --- a/model-00145-of-000163.safetensors +++ b/model-00145-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b2ea4bac41b5a57f3691ea8f77750da21c26e8d1e067b0245739e132893082e3 -size 4302382280 +oid sha256:0e9efbe3faf16406ceb3dce9b31f6bf7cd152f5bf2bef372f88e7f60dd7892e6 +size 8602554224 diff --git a/model-00146-of-000163.safetensors b/model-00146-of-000163.safetensors index 45e3a3579a39048dddc277511c0618061600c4f6..76673391f1e2b14bbf34ca51cd4d03ad0ffc7a5b 100644 --- a/model-00146-of-000163.safetensors +++ b/model-00146-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:97a73fd6d8099d1ca26d7c8ec944f0350fd5eb74d1ee25a6dd47a1a18a2ca8de -size 4302382720 +oid sha256:60c50dde74a68ae0af0f27e60921086088e5315e8d036c9996e70b8966c1605f +size 8602554448 diff --git a/model-00147-of-000163.safetensors b/model-00147-of-000163.safetensors index 355aa1e715a4704fcf2fdcb5bd3be3d7e919c51d..8673cb93a7dd47bab1ad9ddbf501d5eb926be2a9 100644 --- a/model-00147-of-000163.safetensors +++ b/model-00147-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:45e5c0f0db53fbd63cda8b6c9a124485bf900212e7770377f1af03d8a92490f9 -size 4302348376 +oid sha256:a8753bf6a1f678300b69fe9f59a6c1e452cf1bbfe74b08a10eb5bcc5ecc33643 +size 8598786608 diff --git a/model-00148-of-000163.safetensors b/model-00148-of-000163.safetensors index be9589b90942d218f46aa281a0bd9a7af01b5fd1..616bded67b7d8e2f3bd6a7fc17d7c0d26e99c96d 100644 --- a/model-00148-of-000163.safetensors +++ b/model-00148-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b59ca257a4229e1d0ea1bc7a47ba6b0312d5fba632c214cf0b7bf3128169e6b8 -size 4302382472 +oid sha256:8f74f7457bb2d8bb8cfdaa6ed11fe7be128d146187c9f4cda016deee815b79fa +size 8602554320 diff --git a/model-00149-of-000163.safetensors b/model-00149-of-000163.safetensors index 1ea8be4ab1331989472709a42f991583e88865a7..34575128b46ed89d4e44bd84b7b64dfe32cfd946 100644 --- a/model-00149-of-000163.safetensors +++ b/model-00149-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3e210c5a0ac3148ffd88953ac3645ae2561a787349fd788ebba77445d406f11a -size 4302382720 +oid sha256:8726e40eaa3a9669cb51980857ebd5f03e6cff19b39fa76ca406abb3e2a28908 +size 8602554448 diff --git a/model-00150-of-000163.safetensors b/model-00150-of-000163.safetensors index efd3b6c4e46445bd617de3cc677bb67d057e5ec3..850638a0ac2c3b82158c3abf0212411794336fbb 100644 --- a/model-00150-of-000163.safetensors +++ b/model-00150-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:26d6502cd7b86c6e49bd734214596ccf900a473f0e5d1c363592b1c52ab08b9b -size 4302348184 +oid sha256:f7c47c83a01d65bde0f6a8ba569ce9d99f13f542893a9402f2613c737a89caca +size 8598786504 diff --git a/model-00151-of-000163.safetensors b/model-00151-of-000163.safetensors index 081117839036e9567fecf7f59aa68f876b9ab5ed..807fa215aa619e23a4c0b766fa12cc85ded7991e 100644 --- a/model-00151-of-000163.safetensors +++ b/model-00151-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:16f7d8cc5bbb3e0a28b0490fc096104998f1a1c55d0e8af3b4237460dd1dc6c1 -size 4302382656 +oid sha256:ec3e3f1dd53186ce6906726f34f1521fe2d9a8b4dc591ab68eefefb88680dda9 +size 8602554416 diff --git a/model-00152-of-000163.safetensors b/model-00152-of-000163.safetensors index 557d03254520ef1f7dcf7b03b14d9618eec0b753..ba103c5bad73756aa6d6ec8bdb3f18191e7beb76 100644 --- a/model-00152-of-000163.safetensors +++ b/model-00152-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d52e13133c694923d5a8f6c8258c5aed857afeba4062f70a0eaf06a0c970aab8 -size 4302348584 +oid sha256:36cb6721c8fe521ddb481a989214ad10ba4513a25fa7bf172aa1e2f3e0d2c733 +size 8598786704 diff --git a/model-00153-of-000163.safetensors b/model-00153-of-000163.safetensors index c6dcf272b47755fd271a4af0d1539d605f9e4611..d0d1ffd2d9aaa54abc4ff7319bc0696d39ab4743 100644 --- a/model-00153-of-000163.safetensors +++ b/model-00153-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c495ecfabf288abc81cea962b7676872f92e63c6b0260bc2f9cbc75418e00445 -size 4302382264 +oid sha256:7053d92c470ced5edc16d3480dee3429b65726e361499425b5a6c9edd6a95d7a +size 8602554224 diff --git a/model-00154-of-000163.safetensors b/model-00154-of-000163.safetensors index 91aa1a0bec11f1cdd65783d5676075a120bfdbd9..96f8c3965f30306453b0980c00730e5a800f6a26 100644 --- a/model-00154-of-000163.safetensors +++ b/model-00154-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5035c3fc7b727c6087ce3eee4de9a2979d821b7ccfbf61c793bb2ea13634f2dd -size 4302382720 +oid sha256:9487c21d2cfcea4fdc15e72797e222b5f762880311f7ca82215d21a9c38f5621 +size 8602554448 diff --git a/model-00155-of-000163.safetensors b/model-00155-of-000163.safetensors index 528069af79c412d78002cc142e0692d137de35a0..b768a3694e3ad2f41c3871ca838ae4a86312b551 100644 --- a/model-00155-of-000163.safetensors +++ b/model-00155-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ba6d0f7721fb778cd99bf79936fd18044d3badd960715b494b73bbcd47c83975 -size 4302348392 +oid sha256:ac9f236890df19d27c68ec275ef66e262120220f2c52d3fcf083f773a53724e6 +size 8598786616 diff --git a/model-00156-of-000163.safetensors b/model-00156-of-000163.safetensors index 47f929f85f598f573a5064357e17be2d6f54448a..4edeb33f9b9d44d904ef33b11d9960d7a9dc55f1 100644 --- a/model-00156-of-000163.safetensors +++ b/model-00156-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d7b340d7dfee6e91cc40a124255a95b459be3076d533812ce2bf2cb12a569871 -size 4302382448 +oid sha256:9c4ee5ab9972c55414fc4e8149562ecac6f06c403dd89034273ae2b9aa658b81 +size 8602554312 diff --git a/model-00157-of-000163.safetensors b/model-00157-of-000163.safetensors index 1d0276d5b92c363f6d0be0ae1da5ef1f0acd63b6..cda4f270331b04d7ff523b1e9969c51509c5713d 100644 --- a/model-00157-of-000163.safetensors +++ b/model-00157-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:30f304992839e80b1bd5037b8f76650a54794a0972a035e05ee5b681a992f80b -size 4302382720 +oid sha256:b8eea3c625b990e4d2da908c50f537b343b319eb5839e779e107a2f7ffaac7f1 +size 8602554448 diff --git a/model-00158-of-000163.safetensors b/model-00158-of-000163.safetensors index a6b3459a7e22f01ecf451936622b8a96cb664526..17c1a2ca8c6f67a4e663ae3ae8451b87f06ae7fd 100644 --- a/model-00158-of-000163.safetensors +++ b/model-00158-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6c4893dc2329dbbb9291ae3f2980c03379f3775ab17f5e1ae464c9b4ccf0c8f5 -size 4302348200 +oid sha256:25803a541f1a789d96f5da7d8e617da03852ad17c875f9c1a4293c020ea93365 +size 8598786520 diff --git a/model-00159-of-000163.safetensors b/model-00159-of-000163.safetensors index a6916f6eeb494ab93912e6d4669d4fe5359ffb55..ed5eaff6d6bd57d1e5699b8942c2ce80cdf11101 100644 --- a/model-00159-of-000163.safetensors +++ b/model-00159-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0e4709521cf5642ad7fc91a495f71e2f2150105f70430b160f8e8cf65ef903a3 -size 4302382640 +oid sha256:8d9a00b5032f673f042d91e146d6cd9918de0551f8f95119b2c6b9d49faff271 +size 8602554408 diff --git a/model-00160-of-000163.safetensors b/model-00160-of-000163.safetensors index d4702c426254b585a155b390e87c9a48a4aa6643..409f56d9492de5cd9a9387f558e5875a374dfa07 100644 --- a/model-00160-of-000163.safetensors +++ b/model-00160-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4bfe410b7ee190197e02d47771895133970839de3b2be98f79353276882781bc -size 5230635800 +oid sha256:b67ee73f915fc4e7a7764bf0651b93d068cee7f97efb9bfe508538def823cdbf +size 8602463472 diff --git a/model-00161-of-000163.safetensors b/model-00161-of-000163.safetensors index cce16c2f5ddb9b0121bf7fb11f096fd98b7c0db5..e221906bddaf648036aceda4ef487013bc11fa71 100644 --- a/model-00161-of-000163.safetensors +++ b/model-00161-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c8410fc54d2cca5a033964a922bc7f7aa954e7d549f5843606a4ab6ce1e57ccb -size 4302382080 +oid sha256:97503e5faf5cae02e4dd5e59be5038cf909729b8ebbc7cfe21c2467df86544c9 +size 8602554128 diff --git a/model-00162-of-000163.safetensors b/model-00162-of-000163.safetensors index a51ed619d61041addab033c266ba5e5bfdd5a8f3..f02f2501ee488f848dabe255856c928822cda1ca 100644 --- a/model-00162-of-000163.safetensors +++ b/model-00162-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:750fc70b1aa25f64b4f6300883ae14a3283159ce1f9f405e218624078bfe67ed -size 4302382704 +oid sha256:613785e87b259d97621fa002ac58b15b030ae114d54698809e5ab7e55529547f +size 8602554440 diff --git a/model-00163-of-000163.safetensors b/model-00163-of-000163.safetensors index 63ac4021e5a23c75a950910edc2962986b8446d5..23049c71f18fbb416e0227bdc4a7db5c4e1cf809 100644 --- a/model-00163-of-000163.safetensors +++ b/model-00163-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7aaa407921beb2b98efb0394298e388234f8f0faf831f04a1c138104ac4c4826 -size 6584783200 +oid sha256:cb8efe6f2148b98c3d94296912aa63a65ab8d9884d068668d92d3234c5427589 +size 9255875920 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..5b60276c1efb766f6a1aee2e357e27407f6ed12b --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,46188 @@ +{ + "metadata": {}, + "weight_map": { + "model.embed_tokens.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.gate.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.gate.e_score_correction_bias": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.129.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.227.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.input_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_a_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_a_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_b_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_a_proj_with_mqa.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_a_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_b_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.gate.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.gate.e_score_correction_bias": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.161.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.input_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_a_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_a_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_b_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_a_proj_with_mqa.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_a_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_b_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.mlp.gate.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.gate.e_score_correction_bias": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.194.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.194.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.194.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.input_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_a_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_a_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_b_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_a_proj_with_mqa.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_a_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_b_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.gate.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.gate.e_score_correction_bias": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.226.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.input_layernorm.weight": "model-00012-of-000163.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00012-of-000163.safetensors", + "model.layers.7.self_attn.q_a_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_a_layernorm.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_b_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_a_proj_with_mqa.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_a_layernorm.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_b_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.gate.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.gate.e_score_correction_bias": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.190.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.input_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_a_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_a_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_b_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_a_proj_with_mqa.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_a_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_b_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.gate.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.gate.e_score_correction_bias": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.input_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_a_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_a_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_b_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_a_proj_with_mqa.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_a_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_b_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.gate.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.gate.e_score_correction_bias": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.253.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.253.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.253.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.input_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_a_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_a_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_b_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_a_proj_with_mqa.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_a_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_b_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.gate.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.gate.e_score_correction_bias": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.187.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.187.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.187.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.input_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_a_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_a_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_b_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_a_proj_with_mqa.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_a_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_b_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.gate.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.gate.e_score_correction_bias": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.219.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.input_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_a_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_a_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_b_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_a_proj_with_mqa.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_a_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_b_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.gate.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.gate.e_score_correction_bias": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.input_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_a_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_a_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_b_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_a_proj_with_mqa.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_a_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_b_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.gate.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.gate.e_score_correction_bias": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.input_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_a_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_a_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_b_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_a_proj_with_mqa.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_a_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_b_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.gate.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.gate.e_score_correction_bias": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.216.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.216.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.216.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.input_layernorm.weight": "model-00034-of-000163.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00034-of-000163.safetensors", + "model.layers.15.self_attn.q_a_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_a_layernorm.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_b_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_a_proj_with_mqa.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_a_layernorm.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_b_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.gate.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.gate.e_score_correction_bias": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.190.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.input_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_a_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_a_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_b_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_a_proj_with_mqa.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_a_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_b_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.gate.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.gate.e_score_correction_bias": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.input_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_a_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_a_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_b_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_a_proj_with_mqa.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_a_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_b_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.gate.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.gate.e_score_correction_bias": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.253.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.253.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.253.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.input_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_a_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_a_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_b_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_a_proj_with_mqa.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_a_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_b_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.gate.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.gate.e_score_correction_bias": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.187.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.187.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.187.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.input_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_a_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_a_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_b_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_a_proj_with_mqa.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_a_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_b_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.gate.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.gate.e_score_correction_bias": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.219.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.219.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.219.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.input_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_a_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_a_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_b_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_a_proj_with_mqa.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_a_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_b_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.gate.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.gate.e_score_correction_bias": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.153.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.153.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.input_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_a_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_a_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_b_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_a_proj_with_mqa.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_a_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_b_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.gate.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.gate.e_score_correction_bias": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.input_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_a_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_a_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_b_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_a_proj_with_mqa.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_a_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_b_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.gate.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.gate.e_score_correction_bias": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.216.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.216.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.216.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.input_layernorm.weight": "model-00056-of-000163.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00056-of-000163.safetensors", + "model.layers.23.self_attn.q_a_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.q_a_layernorm.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.q_b_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_a_proj_with_mqa.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_a_layernorm.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_b_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.gate.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.gate.e_score_correction_bias": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.190.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.190.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.190.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.input_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_a_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_a_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_b_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_a_proj_with_mqa.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_a_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_b_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.gate.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.gate.e_score_correction_bias": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.input_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_a_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_a_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_b_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_a_proj_with_mqa.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_a_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_b_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.gate.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.gate.e_score_correction_bias": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.253.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.253.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.253.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.input_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_a_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_a_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_b_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_a_proj_with_mqa.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_a_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_b_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.gate.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.gate.e_score_correction_bias": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.187.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.187.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.187.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.input_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_a_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_a_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_b_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_a_proj_with_mqa.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_a_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_b_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.gate.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.gate.e_score_correction_bias": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.219.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.219.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.219.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.input_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_a_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_a_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_b_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_a_proj_with_mqa.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_a_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_b_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.gate.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.gate.e_score_correction_bias": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.153.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.153.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.input_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_a_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_a_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_b_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_a_proj_with_mqa.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_a_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_b_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.gate.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.gate.e_score_correction_bias": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.input_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_a_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_a_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_b_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_a_proj_with_mqa.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_a_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_b_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.gate.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.gate.e_score_correction_bias": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.216.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.216.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.216.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.input_layernorm.weight": "model-00078-of-000163.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00078-of-000163.safetensors", + "model.layers.31.self_attn.q_a_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.q_a_layernorm.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.q_b_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_a_proj_with_mqa.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_a_layernorm.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_b_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.gate.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.gate.e_score_correction_bias": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.190.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.190.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.190.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.input_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_a_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_a_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_b_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_a_proj_with_mqa.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_a_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_b_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.gate.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.gate.e_score_correction_bias": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.input_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_a_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_a_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_b_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_a_proj_with_mqa.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_a_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_b_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.gate.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.gate.e_score_correction_bias": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.253.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.253.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.253.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.input_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_a_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_a_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_b_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_a_proj_with_mqa.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_a_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_b_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.gate.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.gate.e_score_correction_bias": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.187.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.187.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.187.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.input_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_a_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_a_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_b_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_a_proj_with_mqa.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_a_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_b_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.gate.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.gate.e_score_correction_bias": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.219.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.input_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_a_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_a_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_b_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_a_proj_with_mqa.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_a_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_b_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.gate.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.gate.e_score_correction_bias": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.input_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_a_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_a_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_b_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_a_proj_with_mqa.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_a_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_b_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.gate.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.gate.e_score_correction_bias": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.input_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_a_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_a_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_b_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_a_proj_with_mqa.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_a_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_b_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.gate.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.gate.e_score_correction_bias": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.216.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.216.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.216.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.input_layernorm.weight": "model-00100-of-000163.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00100-of-000163.safetensors", + "model.layers.39.self_attn.q_a_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_a_layernorm.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_b_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_a_proj_with_mqa.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_a_layernorm.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_b_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.o_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.gate.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.gate.e_score_correction_bias": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.190.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.input_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_a_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_a_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_b_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_a_proj_with_mqa.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_a_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_b_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.gate.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.gate.e_score_correction_bias": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.input_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_a_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_a_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_b_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_a_proj_with_mqa.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_a_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_b_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.o_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.gate.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.gate.e_score_correction_bias": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.253.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.253.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.253.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.input_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.41.post_attention_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_a_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_a_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_b_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_a_proj_with_mqa.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_a_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_b_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.gate.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.gate.e_score_correction_bias": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.187.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.187.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.187.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.input_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_a_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_a_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_b_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_a_proj_with_mqa.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_a_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_b_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.o_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.gate.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.gate.e_score_correction_bias": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.219.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.input_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_a_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_a_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_b_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_a_proj_with_mqa.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_a_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_b_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.gate.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.gate.e_score_correction_bias": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.input_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_a_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_a_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_b_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_a_proj_with_mqa.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_a_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_b_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.o_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.gate.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.gate.e_score_correction_bias": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.input_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_a_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_a_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_b_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_a_proj_with_mqa.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_a_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_b_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.gate.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.gate.e_score_correction_bias": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.216.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.216.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.216.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.input_layernorm.weight": "model-00122-of-000163.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00122-of-000163.safetensors", + "model.layers.47.self_attn.q_a_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_a_layernorm.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_b_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_a_proj_with_mqa.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_a_layernorm.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_b_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.o_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.gate.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.gate.e_score_correction_bias": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.92.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.190.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.input_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.47.post_attention_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_a_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_a_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_b_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_a_proj_with_mqa.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_a_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_b_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.o_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.gate.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.gate.e_score_correction_bias": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.input_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.48.post_attention_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_a_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_a_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_b_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_a_proj_with_mqa.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_a_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_b_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.o_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.gate.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.gate.e_score_correction_bias": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.253.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.253.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.253.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.input_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.49.post_attention_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_a_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_a_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_b_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_a_proj_with_mqa.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_a_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_b_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.o_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.gate.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.gate.e_score_correction_bias": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.187.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.187.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.187.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.input_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.50.post_attention_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_a_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_a_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_b_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_a_proj_with_mqa.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_a_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_b_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.o_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.gate.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.gate.e_score_correction_bias": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.219.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.input_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.51.post_attention_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_a_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_a_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_b_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_a_proj_with_mqa.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_a_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_b_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.o_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.gate.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.gate.e_score_correction_bias": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.input_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.52.post_attention_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_a_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_a_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_b_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_a_proj_with_mqa.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_a_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_b_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.o_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.gate.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.gate.e_score_correction_bias": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.input_layernorm.weight": "model-00141-of-000163.safetensors", + "model.layers.53.post_attention_layernorm.weight": "model-00141-of-000163.safetensors", + "model.layers.54.self_attn.q_a_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_a_layernorm.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_b_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_a_proj_with_mqa.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_a_layernorm.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_b_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.o_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.gate.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.gate.e_score_correction_bias": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.92.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.92.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.190.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.input_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.54.post_attention_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_a_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_a_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_b_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_a_proj_with_mqa.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_a_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_b_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.o_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.gate.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.gate.e_score_correction_bias": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.input_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.55.post_attention_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_a_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_a_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_b_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_a_proj_with_mqa.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_a_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_b_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.o_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.gate.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.gate.e_score_correction_bias": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.253.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.253.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.253.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.input_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.56.post_attention_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_a_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_a_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_b_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_a_proj_with_mqa.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_a_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_b_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.o_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.gate.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.gate.e_score_correction_bias": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.187.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.187.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.187.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.input_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.57.post_attention_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_a_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_a_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_b_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_a_proj_with_mqa.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_a_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_b_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.o_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.gate.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.gate.e_score_correction_bias": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.219.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.input_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.58.post_attention_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_a_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_a_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_b_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_a_proj_with_mqa.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_a_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_b_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.o_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.gate.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.gate.e_score_correction_bias": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.55.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.input_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.59.post_attention_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_a_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_a_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_b_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_a_proj_with_mqa.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_a_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_b_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.o_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.gate.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.gate.e_score_correction_bias": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.input_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.60.post_attention_layernorm.weight": "model-00160-of-000163.safetensors", + "model.norm.weight": "model-00160-of-000163.safetensors", + "lm_head.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_a_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_a_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_b_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_a_proj_with_mqa.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_a_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_b_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.o_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.gate.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.gate.e_score_correction_bias": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.195.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.195.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.195.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.input_layernorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.post_attention_layernorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.embed_tokens.weight": "model-00163-of-000163.safetensors", + "model.layers.61.enorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.hnorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.eh_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.shared_head.norm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.shared_head.head.weight": "model-00163-of-000163.safetensors" + } +} \ No newline at end of file